docling/tests/data/groundtruth/docling_v1/2203.01017v2.pages.json
Christoph Auer e00f362405
Some checks failed
Run Docs CI / build-docs (push) Failing after 1m26s
Run CI / code-checks (push) Failing after 6m37s
Update tests, use TextCell.from_ocr property
Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-03-13 16:04:08 +01:00

1 line
1.4 MiB

[{"page_no": 0, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.918, "r_y0": 171.21699999999998, "r_x1": 332.306, "r_y1": 171.21699999999998, "r_x2": 332.306, "r_y2": 160.95500000000004, "r_x3": 262.918, "r_y3": 160.95500000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 261.938, "r_x1": 130.062, "r_y1": 261.938, "r_x2": 130.062, "r_y2": 253.35000000000002, "r_x3": 50.112, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "pact representation.", "orig": "pact representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.475, "r_y0": 261.938, "r_x1": 286.365, "r_y1": 261.938, "r_x2": 286.365, "r_y2": 253.35000000000002, "r_x3": 134.475, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "This content is extremely valuable for", "orig": "This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 273.89300000000003, "r_x1": 286.365, "r_y1": 273.89300000000003, "r_x2": 286.365, "r_y2": 265.30499999999995, "r_x3": 50.112, "r_y3": 265.30499999999995, "coord_origin": "TOPLEFT"}, "text": "systems such as search engines, Knowledge Graph's, etc,", "orig": "systems such as search engines, Knowledge Graph's, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 285.849, "r_x1": 245.18, "r_y1": 285.849, "r_x2": 245.18, "r_y2": 277.26099999999997, "r_x3": 50.112, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "since they enhance their predictive capabilities.", "orig": "since they enhance their predictive capabilities.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.496, "r_y0": 285.849, "r_x1": 286.365, "r_y1": 285.849, "r_x2": 286.365, "r_y2": 277.26099999999997, "r_x3": 251.496, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "Unfortu-", "orig": "Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 297.804, "r_x1": 286.365, "r_y1": 297.804, "r_x2": 286.365, "r_y2": 289.216, "r_x3": 50.112, "r_y3": 289.216, "coord_origin": "TOPLEFT"}, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 309.759, "r_x1": 103.601, "r_y1": 309.759, "r_x2": 103.601, "r_y2": 301.171, "r_x3": 50.112, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 108.393, "r_y0": 309.759, "r_x1": 124.692, "r_y1": 309.759, "r_x2": 124.692, "r_y2": 301.171, "r_x3": 108.393, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "they", "orig": "they", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.026, "r_y0": 309.759, "r_x1": 286.365, "r_y1": 309.759, "r_x2": 286.365, "r_y2": 301.171, "r_x3": 129.026, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "can have complex column/row-header", "orig": "can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 321.714, "r_x1": 286.365, "r_y1": 321.714, "r_x2": 286.365, "r_y2": 313.126, "r_x3": 50.112, "r_y3": 313.126, "coord_origin": "TOPLEFT"}, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 333.669, "r_x1": 175.123, "r_y1": 333.669, "r_x2": 175.123, "r_y2": 325.081, "r_x3": 50.112, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "tion lines, missing entries, etc.", "orig": "tion lines, missing entries, etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.931, "r_y0": 333.669, "r_x1": 286.365, "r_y1": 333.669, "r_x2": 286.365, "r_y2": 325.081, "r_x3": 180.931, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "As such, the correct iden-", "orig": "As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 345.624, "r_x1": 85.539, "r_y1": 345.624, "r_x2": 85.539, "r_y2": 337.036, "r_x3": 50.112, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "tification", "orig": "tification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.942, "r_y0": 345.624, "r_x1": 97.693, "r_y1": 345.624, "r_x2": 97.693, "r_y2": 337.036, "r_x3": 89.942, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.107, "r_y0": 345.624, "r_x1": 114.281, "r_y1": 345.624, "r_x2": 114.281, "r_y2": 337.036, "r_x3": 102.107, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.695, "r_y0": 345.624, "r_x1": 177.534, "r_y1": 345.624, "r_x2": 177.534, "r_y2": 337.036, "r_x3": 118.695, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 345.624, "r_x1": 286.365, "r_y1": 345.624, "r_x2": 286.365, "r_y2": 337.036, "r_x3": 181.947, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "from an image is a non-", "orig": "from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 357.58, "r_x1": 95.791, "r_y1": 357.58, "r_x2": 95.791, "r_y2": 348.992, "r_x3": 50.112, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "trivial task.", "orig": "trivial task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 99.746, "r_y0": 357.58, "r_x1": 286.365, "r_y1": 357.58, "r_x2": 286.365, "r_y2": 348.992, "r_x3": 99.746, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "In this paper, we present a new table-structure", "orig": "In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 369.535, "r_x1": 132.443, "r_y1": 369.535, "r_x2": 132.443, "r_y2": 360.947, "r_x3": 50.112, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "identification model.", "orig": "identification model.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.777, "r_y0": 369.535, "r_x1": 286.365, "r_y1": 369.535, "r_x2": 286.365, "r_y2": 360.947, "r_x3": 136.777, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "The latter improves the latest end-to-", "orig": "The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 381.49, "r_x1": 170.4, "r_y1": 381.49, "r_x2": 170.4, "r_y2": 372.902, "r_x3": 50.112, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "end deep learning model (i.e.", "orig": "end deep learning model (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.248, "r_y0": 381.49, "r_x1": 286.365, "r_y1": 381.49, "r_x2": 286.365, "r_y2": 372.902, "r_x3": 176.248, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder from", "orig": "encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 393.445, "r_x1": 196.572, "r_y1": 393.445, "r_x2": 196.572, "r_y2": 384.857, "r_x3": 50.112, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "PubTabNet) in two significant ways.", "orig": "PubTabNet) in two significant ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.643, "r_y0": 393.445, "r_x1": 286.365, "r_y1": 393.445, "r_x2": 286.365, "r_y2": 384.857, "r_x3": 201.643, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "First, we introduce a", "orig": "First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 405.4, "r_x1": 232.328, "r_y1": 405.4, "r_x2": 232.328, "r_y2": 396.812, "r_x3": 50.112, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "new object detection decoder for table-cells.", "orig": "new object detection decoder for table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.584, "r_y0": 405.4, "r_x1": 286.365, "r_y1": 405.4, "r_x2": 286.365, "r_y2": 396.812, "r_x3": 238.584, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "In this way,", "orig": "In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 417.355, "r_x1": 286.365, "r_y1": 417.355, "r_x2": 286.365, "r_y2": 408.767, "r_x3": 50.112, "r_y3": 408.767, "coord_origin": "TOPLEFT"}, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 429.311, "r_x1": 286.365, "r_y1": 429.311, "r_x2": 286.365, "r_y2": 420.723, "r_x3": 50.112, "r_y3": 420.723, "coord_origin": "TOPLEFT"}, "text": "matic PDF's directly from the PDF source and avoid the", "orig": "matic PDF's directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 441.266, "r_x1": 207.232, "r_y1": 441.266, "r_x2": 207.232, "r_y2": 432.678, "r_x3": 50.112, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.096, "r_y0": 441.266, "r_x1": 286.365, "r_y1": 441.266, "r_x2": 286.365, "r_y2": 432.678, "r_x3": 214.096, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 453.221, "r_x1": 286.365, "r_y1": 453.221, "r_x2": 286.365, "r_y2": 444.633, "r_x3": 50.112, "r_y3": 444.633, "coord_origin": "TOPLEFT"}, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 465.176, "r_x1": 204.233, "r_y1": 465.176, "r_x2": 204.233, "r_y2": 456.588, "r_x3": 50.112, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "allows us to tackle non-english tables.", "orig": "allows us to tackle non-english tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.587, "r_y0": 465.176, "r_x1": 286.365, "r_y1": 465.176, "r_x2": 286.365, "r_y2": 456.588, "r_x3": 208.587, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "Second, we replace", "orig": "Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 477.131, "r_x1": 286.365, "r_y1": 477.131, "r_x2": 286.365, "r_y2": 468.543, "r_x3": 50.112, "r_y3": 468.543, "coord_origin": "TOPLEFT"}, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 489.087, "r_x1": 286.365, "r_y1": 489.087, "r_x2": 286.365, "r_y2": 480.499, "r_x3": 50.112, "r_y3": 480.499, "coord_origin": "TOPLEFT"}, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.042, "r_x1": 286.365, "r_y1": 501.042, "r_x2": 286.365, "r_y2": 492.454, "r_x3": 50.112, "r_y3": 492.454, "coord_origin": "TOPLEFT"}, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 512.9970000000001, "r_x1": 276.652, "r_y1": 512.9970000000001, "r_x2": 276.652, "r_y2": 504.409, "r_x3": 50.112, "r_y3": 504.409, "coord_origin": "TOPLEFT"}, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.759, "r_y0": 569.604, "r_x1": 178.51, "r_y1": 569.604, "r_x2": 178.51, "r_y2": 561.052, "r_x3": 170.759, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.003, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 183.003, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "documents is ubiquitous.", "orig": "documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 119.95, "r_y1": 605.47, "r_x2": 119.95, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "tremely valuable.", "orig": "tremely valuable.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.778, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 125.778, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, this compact representa-", "orig": "Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 101.848, "r_y1": 701.111, "r_x2": 101.848, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "table-entries.", "orig": "table-entries.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 106.261, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 106.261, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Fig. 1 shows a table which presents all these", "orig": "Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 76.403, "r_y1": 713.066, "r_x2": 76.403, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.463, "r_y0": 333.15, "r_x1": 472.474, "r_y1": 333.15, "r_x2": 472.474, "r_y2": 324.837, "r_x3": 326.463, "r_y3": 324.837, "coord_origin": "TOPLEFT"}, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.176, "r_y0": 523.321, "r_x1": 545.115, "r_y1": 523.321, "r_x2": 545.115, "r_y2": 514.769, "r_x3": 353.176, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 535.2760000000001, "r_x1": 545.115, "r_y1": 535.2760000000001, "r_x2": 545.115, "r_y2": 526.7239999999999, "r_x3": 308.862, "r_y3": 526.7239999999999, "coord_origin": "TOPLEFT"}, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 547.231, "r_x1": 445.539, "r_y1": 547.231, "r_x2": 445.539, "r_y2": 538.679, "r_x3": 308.862, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "text and (3) cells with no content.", "orig": "text and (3) cells with no content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.221, "r_y0": 547.231, "r_x1": 545.115, "r_y1": 547.231, "r_x2": 545.115, "r_y2": 538.679, "r_x3": 450.221, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "Image from PubTabNet", "orig": "Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 559.187, "r_x1": 505.692, "r_y1": 559.187, "r_x2": 505.692, "r_y2": 550.635, "r_x3": 308.862, "r_y3": 550.635, "coord_origin": "TOPLEFT"}, "text": "evaluation set, filename: 'PMC2944238 004 02'.", "orig": "evaluation set, filename: 'PMC2944238 004 02'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.62, "r_y0": 593.23, "r_x1": 404.134, "r_y1": 593.23, "r_x2": 404.134, "r_y2": 584.678, "r_x3": 362.62, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "significant", "orig": "significant", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.259, "r_y0": 593.23, "r_x1": 545.115, "r_y1": 593.23, "r_x2": 545.115, "r_y2": 584.678, "r_x3": 408.259, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "progress has been made with vi-", "orig": "progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.185, "r_x1": 526.365, "r_y1": 605.185, "r_x2": 526.365, "r_y2": 596.633, "r_x3": 308.862, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "sion based approaches to extract tables in documents.", "orig": "sion based approaches to extract tables in documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.426, "r_y0": 605.185, "r_x1": 545.115, "r_y1": 605.185, "r_x2": 545.115, "r_y2": 596.633, "r_x3": 531.426, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "For", "orig": "For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.14, "r_x1": 545.115, "r_y1": 617.14, "r_x2": 545.115, "r_y2": 608.588, "r_x3": 308.862, "r_y3": 608.588, "coord_origin": "TOPLEFT"}, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.095, "r_x1": 545.115, "r_y1": 629.095, "r_x2": 545.115, "r_y2": 620.543, "r_x3": 308.862, "r_y3": 620.543, "coord_origin": "TOPLEFT"}, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0509999999999, "r_x1": 336.807, "r_y1": 641.0509999999999, "r_x2": 336.807, "r_y2": 632.499, "r_x3": 308.862, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "lenges,", "orig": "lenges,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.519, "r_y0": 641.0509999999999, "r_x1": 353.694, "r_y1": 641.0509999999999, "r_x2": 353.694, "r_y2": 632.499, "r_x3": 341.519, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.112, "r_y0": 641.0509999999999, "r_x1": 373.728, "r_y1": 641.0509999999999, "r_x2": 373.728, "r_y2": 632.499, "r_x3": 362.112, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.992, "r_y0": 641.0509999999999, "r_x1": 406.226, "r_y1": 641.0509999999999, "r_x2": 406.226, "r_y2": 632.499, "r_x3": 377.992, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.5, "r_y0": 641.0509999999999, "r_x1": 422.675, "r_y1": 641.0509999999999, "r_x2": 422.675, "r_y2": 632.499, "r_x3": 410.5, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 641.0509999999999, "r_x1": 459.038, "r_y1": 641.0509999999999, "r_x2": 459.038, "r_y2": 632.499, "r_x3": 426.939, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "location", "orig": "location", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.302, "r_y0": 641.0509999999999, "r_x1": 471.601, "r_y1": 641.0509999999999, "r_x2": 471.601, "r_y2": 632.499, "r_x3": 463.302, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.875, "r_y0": 641.0509999999999, "r_x1": 488.049, "r_y1": 641.0509999999999, "r_x2": 488.049, "r_y2": 632.499, "r_x3": 475.875, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.313, "r_y0": 641.0509999999999, "r_x1": 522.191, "r_y1": 641.0509999999999, "r_x2": 522.191, "r_y2": 632.499, "r_x3": 492.313, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "table(s)", "orig": "table(s)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.455, "r_y0": 641.0509999999999, "r_x1": 545.115, "r_y1": 641.0509999999999, "r_x2": 545.115, "r_y2": 632.499, "r_x3": 526.455, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "on a", "orig": "on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.006, "r_x1": 545.115, "r_y1": 653.006, "r_x2": 545.115, "r_y2": 644.454, "r_x3": 308.862, "r_y3": 644.454, "coord_origin": "TOPLEFT"}, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.961, "r_x1": 375.552, "r_y1": 664.961, "r_x2": 375.552, "r_y2": 656.409, "r_x3": 308.862, "r_y3": 656.409, "coord_origin": "TOPLEFT"}, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 474.261, "r_y1": 701.111, "r_x2": 474.261, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "of-the-art object-detection networks (e.g.", "orig": "of-the-art object-detection networks (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 479.342, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 479.342, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "YOLO and later", "orig": "YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 395.796, "r_y1": 713.066, "r_x2": 395.796, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "on Mask-RCNN [9]).", "orig": "on Mask-RCNN [9]).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.046, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 401.046, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "For all practical purposes, it can be", "orig": "For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 8, "label": "section_header", "bbox": {"l": 96.301, "t": 107.03399999999999, "r": 498.927, "b": 119.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8868067860603333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 142.477, "t": 147.00800000000004, "r": 452.75, "b": 157.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7586215734481812, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_header", "bbox": {"l": 18.34, "t": 160.0, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8773143887519836, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "key_value_region", "bbox": {"l": 208.123, "t": 176.562, "r": 212.731, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.4854728579521179, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 208.123, "t": 176.562, "r": 212.731, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9096331596374512, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 5, "label": "section_header", "bbox": {"l": 145.995, "t": 215.48299999999995, "r": 190.48, "b": 226.231, "coord_origin": "TOPLEFT"}, "confidence": 0.9258671402931213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "section_header", "bbox": {"l": 315.567, "t": 218.34900000000005, "r": 408.441, "b": 226.66200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6724023818969727, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 241.39499999999998, "r": 286.365, "b": 249.98299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9838882088661194, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "list_item", "bbox": {"l": 315.567, "t": 314.037, "r": 486.402, "b": 322.35, "coord_origin": "TOPLEFT"}, "confidence": 0.5549328923225403, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 315.567, "t": 420.525, "r": 491.191, "b": 428.838, "coord_origin": "TOPLEFT"}, "confidence": 0.5501358509063721, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "caption", "bbox": {"l": 308.862, "t": 514.769, "r": 345.734, "b": 523.321, "coord_origin": "TOPLEFT"}, "confidence": 0.9214619398117065, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "section_header", "bbox": {"l": 50.112, "t": 539.943, "r": 126.948, "b": 550.691, "coord_origin": "TOPLEFT"}, "confidence": 0.9317677617073059, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 561.052, "r": 166.266, "b": 569.604, "coord_origin": "TOPLEFT"}, "confidence": 0.9841895699501038, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 584.678, "r": 358.077, "b": 593.23, "coord_origin": "TOPLEFT"}, "confidence": 0.9848759770393372, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 668.649, "r": 545.115, "b": 677.201, "coord_origin": "TOPLEFT"}, "confidence": 0.979152262210846, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8045893311500549, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "picture", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.608779788017273, "cells": [], "children": []}, {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [], "children": []}, {"id": 10, "label": "picture", "bbox": {"l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT"}, "confidence": 0.8742761611938477, "cells": [], "children": []}, {"id": 23, "label": "picture", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.5088632702827454, "cells": [], "children": []}, {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"15": {"label": "table", "id": 15, "page_no": 0, "cluster": {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "11": {"label": "table", "id": 11, "page_no": 0, "cluster": {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "section_header", "id": 8, "page_no": 0, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 96.301, "t": 107.03399999999999, "r": 498.927, "b": 119.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8868067860603333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers."}, {"label": "section_header", "id": 13, "page_no": 0, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 142.477, "t": 147.00800000000004, "r": 452.75, "b": 157.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7586215734481812, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar"}, {"label": "page_header", "id": 9, "page_no": 0, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 18.34, "t": 160.0, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8773143887519836, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022"}, {"label": "key_value_region", "id": 25, "page_no": 0, "cluster": {"id": 25, "label": "key_value_region", "bbox": {"l": 208.123, "t": 176.562, "r": 212.731, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.4854728579521179, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 208.123, "t": 176.562, "r": 212.731, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9096331596374512, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null}, {"label": "section_header", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 145.995, "t": 215.48299999999995, "r": 190.48, "b": 226.231, "coord_origin": "TOPLEFT"}, "confidence": 0.9258671402931213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Abstract"}, {"label": "section_header", "id": 14, "page_no": 0, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 315.567, "t": 218.34900000000005, "r": 408.441, "b": 226.66200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6724023818969727, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Picture of a table:"}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 241.39499999999998, "r": 286.365, "b": 249.98299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9838882088661194, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tables organize valuable content in a concise and com-"}, {"label": "list_item", "id": 17, "page_no": 0, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 315.567, "t": 314.037, "r": 486.402, "b": 322.35, "coord_origin": "TOPLEFT"}, "confidence": 0.5549328923225403, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Red-annotation of bounding boxes,"}, {"label": "list_item", "id": 18, "page_no": 0, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 315.567, "t": 420.525, "r": 491.191, "b": 428.838, "coord_origin": "TOPLEFT"}, "confidence": 0.5501358509063721, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "c. Structure predicted by TableFormer:"}, {"label": "caption", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 308.862, "t": 514.769, "r": 345.734, "b": 523.321, "coord_origin": "TOPLEFT"}, "confidence": 0.9214619398117065, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 1:"}, {"label": "section_header", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 50.112, "t": 539.943, "r": 126.948, "b": 550.691, "coord_origin": "TOPLEFT"}, "confidence": 0.9317677617073059, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Introduction"}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 561.052, "r": 166.266, "b": 569.604, "coord_origin": "TOPLEFT"}, "confidence": 0.9841895699501038, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The occurrence of tables"}, {"label": "text", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 584.678, "r": 358.077, "b": 593.23, "coord_origin": "TOPLEFT"}, "confidence": 0.9848759770393372, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Recently,"}, {"label": "text", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 668.649, "r": 545.115, "b": 677.201, "coord_origin": "TOPLEFT"}, "confidence": 0.979152262210846, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The first problem is called table-location and has been"}, {"label": "page_footer", "id": 12, "page_no": 0, "cluster": {"id": 12, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8045893311500549, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1"}, {"label": "picture", "id": 16, "page_no": 0, "cluster": {"id": 16, "label": "picture", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.608779788017273, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 15, "page_no": 0, "cluster": {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 10, "page_no": 0, "cluster": {"id": 10, "label": "picture", "bbox": {"l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT"}, "confidence": 0.8742761611938477, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 23, "page_no": 0, "cluster": {"id": 23, "label": "picture", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.5088632702827454, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 0, "cluster": {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "section_header", "id": 8, "page_no": 0, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 96.301, "t": 107.03399999999999, "r": 498.927, "b": 119.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8868067860603333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers."}, {"label": "section_header", "id": 13, "page_no": 0, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 142.477, "t": 147.00800000000004, "r": 452.75, "b": 157.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7586215734481812, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar"}, {"label": "key_value_region", "id": 25, "page_no": 0, "cluster": {"id": 25, "label": "key_value_region", "bbox": {"l": 208.123, "t": 176.562, "r": 212.731, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.4854728579521179, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 208.123, "t": 176.562, "r": 212.731, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9096331596374512, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null}, {"label": "section_header", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 145.995, "t": 215.48299999999995, "r": 190.48, "b": 226.231, "coord_origin": "TOPLEFT"}, "confidence": 0.9258671402931213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Abstract"}, {"label": "section_header", "id": 14, "page_no": 0, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 315.567, "t": 218.34900000000005, "r": 408.441, "b": 226.66200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6724023818969727, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Picture of a table:"}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 241.39499999999998, "r": 286.365, "b": 249.98299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9838882088661194, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tables organize valuable content in a concise and com-"}, {"label": "list_item", "id": 17, "page_no": 0, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 315.567, "t": 314.037, "r": 486.402, "b": 322.35, "coord_origin": "TOPLEFT"}, "confidence": 0.5549328923225403, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Red-annotation of bounding boxes,"}, {"label": "list_item", "id": 18, "page_no": 0, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 315.567, "t": 420.525, "r": 491.191, "b": 428.838, "coord_origin": "TOPLEFT"}, "confidence": 0.5501358509063721, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "c. Structure predicted by TableFormer:"}, {"label": "caption", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 308.862, "t": 514.769, "r": 345.734, "b": 523.321, "coord_origin": "TOPLEFT"}, "confidence": 0.9214619398117065, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 1:"}, {"label": "section_header", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 50.112, "t": 539.943, "r": 126.948, "b": 550.691, "coord_origin": "TOPLEFT"}, "confidence": 0.9317677617073059, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Introduction"}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 561.052, "r": 166.266, "b": 569.604, "coord_origin": "TOPLEFT"}, "confidence": 0.9841895699501038, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The occurrence of tables"}, {"label": "text", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 584.678, "r": 358.077, "b": 593.23, "coord_origin": "TOPLEFT"}, "confidence": 0.9848759770393372, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Recently,"}, {"label": "text", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 668.649, "r": 545.115, "b": 677.201, "coord_origin": "TOPLEFT"}, "confidence": 0.979152262210846, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The first problem is called table-location and has been"}, {"label": "picture", "id": 16, "page_no": 0, "cluster": {"id": 16, "label": "picture", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.608779788017273, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 15, "page_no": 0, "cluster": {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 10, "page_no": 0, "cluster": {"id": 10, "label": "picture", "bbox": {"l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT"}, "confidence": 0.8742761611938477, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 23, "page_no": 0, "cluster": {"id": 23, "label": "picture", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.5088632702827454, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 0, "cluster": {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_header", "id": 9, "page_no": 0, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 18.34, "t": 160.0, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8773143887519836, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022"}, {"label": "page_footer", "id": 12, "page_no": 0, "cluster": {"id": 12, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8045893311500549, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1"}]}}, {"page_no": 1, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 112.647, "r_y1": 95.98400000000004, "r_x2": 112.647, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 120.34699999999998, "r_x1": 74.75, "r_y1": 120.34699999999998, "r_x2": 74.75, "r_y2": 111.79499999999996, "r_x3": 50.112, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.335, "r_y0": 120.34699999999998, "r_x1": 286.365, "r_y1": 120.34699999999998, "r_x2": 286.365, "r_y2": 111.79499999999996, "r_x3": 81.335, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 132.30200000000002, "r_x1": 235.117, "r_y1": 132.30200000000002, "r_x2": 235.117, "r_y2": 123.75, "r_x3": 50.112, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "munity of document understanding [6, 4, 14].", "orig": "munity of document understanding [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.079, "r_y0": 132.30200000000002, "r_x1": 286.365, "r_y1": 132.30200000000002, "r_x2": 286.365, "r_y2": 123.75, "r_x3": 240.079, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "Contrary to", "orig": "Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 144.25699999999995, "r_x1": 286.365, "r_y1": 144.25699999999995, "r_x2": 286.365, "r_y2": 135.70500000000004, "r_x3": 50.112, "r_y3": 135.70500000000004, "coord_origin": "TOPLEFT"}, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 156.21299999999997, "r_x1": 286.365, "r_y1": 156.21299999999997, "r_x2": 286.365, "r_y2": 147.66099999999994, "r_x3": 50.112, "r_y3": 147.66099999999994, "coord_origin": "TOPLEFT"}, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 168.168, "r_x1": 286.365, "r_y1": 168.168, "r_x2": 286.365, "r_y2": 159.61599999999999, "r_x3": 50.112, "r_y3": 159.61599999999999, "coord_origin": "TOPLEFT"}, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.12300000000005, "r_x1": 286.365, "r_y1": 180.12300000000005, "r_x2": 286.365, "r_y2": 171.57100000000003, "r_x3": 50.112, "r_y3": 171.57100000000003, "coord_origin": "TOPLEFT"}, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.07799999999997, "r_x1": 286.365, "r_y1": 192.07799999999997, "r_x2": 286.365, "r_y2": 183.52599999999995, "r_x3": 50.112, "r_y3": 183.52599999999995, "coord_origin": "TOPLEFT"}, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.03300000000002, "r_x1": 114.51, "r_y1": 204.03300000000002, "r_x2": 114.51, "r_y2": 195.481, "r_x3": 50.112, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "nesses (see Sec.", "orig": "nesses (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.163, "r_y0": 204.03300000000002, "r_x1": 129.952, "r_y1": 204.03300000000002, "r_x2": 129.952, "r_y2": 195.481, "r_x3": 119.163, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "2).", "orig": "2).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.615, "r_y0": 204.03300000000002, "r_x1": 286.365, "r_y1": 204.03300000000002, "r_x2": 286.365, "r_y2": 195.481, "r_x3": 134.615, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "The common denominator here is the", "orig": "The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.98800000000006, "r_x1": 286.365, "r_y1": 215.98800000000006, "r_x2": 286.365, "r_y2": 207.43600000000004, "r_x3": 50.112, "r_y3": 207.43600000000004, "coord_origin": "TOPLEFT"}, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.94399999999996, "r_x1": 278.664, "r_y1": 227.94399999999996, "r_x2": 278.664, "r_y2": 219.39200000000005, "r_x3": 50.112, "r_y3": 219.39200000000005, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 252.30700000000002, "r_x1": 78.884, "r_y1": 252.30700000000002, "r_x2": 78.884, "r_y2": 243.755, "r_x3": 50.112, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "present", "orig": "present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 83.068, "r_y0": 252.30700000000002, "r_x1": 116.373, "r_y1": 252.30700000000002, "r_x2": 116.373, "r_y2": 243.755, "r_x3": 83.068, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "a robust", "orig": "a robust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 120.558, "r_y0": 252.30700000000002, "r_x1": 178.102, "r_y1": 252.30700000000002, "r_x2": 178.102, "r_y2": 243.755, "r_x3": 120.558, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.276, "r_y0": 252.30700000000002, "r_x1": 286.365, "r_y1": 252.30700000000002, "r_x2": 286.365, "r_y2": 243.755, "r_x3": 182.276, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "decomposition algorithm.", "orig": "decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.26199999999994, "r_x1": 260.432, "r_y1": 264.26199999999994, "r_x2": 260.432, "r_y2": 255.71000000000004, "r_x3": 50.112, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "The design criteria for our model are the following.", "orig": "The design criteria for our model are the following.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.603, "r_y0": 264.26199999999994, "r_x1": 286.365, "r_y1": 264.26199999999994, "r_x2": 286.365, "r_y2": 255.71000000000004, "r_x3": 265.603, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "First,", "orig": "First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.217, "r_x1": 286.365, "r_y1": 276.217, "r_x2": 286.365, "r_y2": 267.66499999999996, "r_x3": 50.112, "r_y3": 267.66499999999996, "coord_origin": "TOPLEFT"}, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.172, "r_x1": 286.365, "r_y1": 288.172, "r_x2": 286.365, "r_y2": 279.62, "r_x3": 50.112, "r_y3": 279.62, "coord_origin": "TOPLEFT"}, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.128, "r_x1": 88.568, "r_y1": 300.128, "r_x2": 88.568, "r_y2": 291.576, "r_x3": 50.112, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 95.502, "r_y0": 300.128, "r_x1": 286.365, "r_y1": 300.128, "r_x2": 286.365, "r_y2": 291.576, "r_x3": 95.502, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.083, "r_x1": 286.365, "r_y1": 312.083, "r_x2": 286.365, "r_y2": 303.531, "r_x3": 50.112, "r_y3": 303.531, "coord_origin": "TOPLEFT"}, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.038, "r_x1": 286.365, "r_y1": 324.038, "r_x2": 286.365, "r_y2": 315.486, "r_x3": 50.112, "r_y3": 315.486, "coord_origin": "TOPLEFT"}, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.993, "r_x1": 286.365, "r_y1": 335.993, "r_x2": 286.365, "r_y2": 327.441, "r_x3": 50.112, "r_y3": 327.441, "coord_origin": "TOPLEFT"}, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.948, "r_x1": 286.365, "r_y1": 347.948, "r_x2": 286.365, "r_y2": 339.396, "r_x3": 50.112, "r_y3": 339.396, "coord_origin": "TOPLEFT"}, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.904, "r_x1": 286.365, "r_y1": 359.904, "r_x2": 286.365, "r_y2": 351.352, "r_x3": 50.112, "r_y3": 351.352, "coord_origin": "TOPLEFT"}, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.859, "r_x1": 76.951, "r_y1": 371.859, "r_x2": 76.951, "r_y2": 363.307, "r_x3": 50.112, "r_y3": 363.307, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.222, "r_x1": 120.986, "r_y1": 396.222, "r_x2": 120.986, "r_y2": 387.67, "r_x3": 50.112, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.901, "r_y0": 396.238, "r_x1": 179.731, "r_y1": 396.238, "r_x2": 179.731, "r_y2": 387.282, "r_x3": 123.901, "r_y3": 387.282, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.646, "r_y0": 396.222, "r_x1": 286.367, "r_y1": 396.222, "r_x2": 286.367, "r_y2": 387.67, "r_x3": 182.646, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.177, "r_x1": 181.758, "r_y1": 408.177, "r_x2": 181.758, "r_y2": 399.625, "r_x3": 50.112, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.104, "r_y0": 408.193, "r_x1": 240.203, "r_y1": 408.193, "r_x2": 240.203, "r_y2": 399.237, "r_x3": 184.104, "r_y3": 399.237, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.204, "r_y0": 403.942, "r_x1": 243.691, "r_y1": 403.942, "r_x2": 243.691, "r_y2": 397.956, "r_x3": 240.204, "r_y3": 397.956, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.189, "r_y0": 408.177, "r_x1": 246.68, "r_y1": 408.177, "r_x2": 246.68, "r_y2": 399.625, "r_x3": 244.189, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.718, "r_y0": 408.177, "r_x1": 286.361, "r_y1": 408.177, "r_x2": 286.361, "r_y2": 399.625, "r_x3": 249.718, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "In partic-", "orig": "In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.132, "r_x1": 67.696, "r_y1": 420.132, "r_x2": 67.696, "r_y2": 411.58, "r_x3": 50.112, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "ular,", "orig": "ular,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.322, "r_y0": 420.132, "r_x1": 286.365, "r_y1": 420.132, "r_x2": 286.365, "r_y2": 411.58, "r_x3": 71.322, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "our contributions in this work can be summarised as", "orig": "our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.087, "r_x1": 82.52, "r_y1": 432.087, "r_x2": 82.52, "r_y2": 423.535, "r_x3": 50.112, "r_y3": 423.535, "coord_origin": "TOPLEFT"}, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 453.372, "r_x1": 117.101, "r_y1": 453.372, "r_x2": 117.101, "r_y2": 444.82, "r_x3": 70.037, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.59, "r_y0": 453.388, "r_x1": 175.42, "r_y1": 453.388, "r_x2": 175.42, "r_y2": 444.432, "r_x3": 119.59, "r_y3": 444.432, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.421, "r_y0": 453.372, "r_x1": 286.365, "r_y1": 453.372, "r_x2": 286.365, "r_y2": 444.82, "r_x3": 175.421, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 465.327, "r_x1": 286.365, "r_y1": 465.327, "r_x2": 286.365, "r_y2": 456.775, "r_x3": 70.037, "r_y3": 456.775, "coord_origin": "TOPLEFT"}, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 477.282, "r_x1": 286.365, "r_y1": 477.282, "r_x2": 286.365, "r_y2": 468.73, "r_x3": 70.037, "r_y3": 468.73, "coord_origin": "TOPLEFT"}, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 489.237, "r_x1": 99.636, "r_y1": 489.237, "r_x2": 99.636, "r_y2": 480.685, "r_x3": 70.037, "r_y3": 480.685, "coord_origin": "TOPLEFT"}, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 510.974, "r_x1": 111.88, "r_y1": 510.974, "r_x2": 111.88, "r_y2": 502.422, "r_x3": 70.037, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "Across all", "orig": "Across all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.084, "r_y0": 510.974, "r_x1": 196.104, "r_y1": 510.974, "r_x2": 196.104, "r_y2": 502.422, "r_x3": 116.084, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "benchmark datasets", "orig": "benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.034, "r_x3": 200.31, "r_y3": 502.034, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.35, "r_y0": 510.974, "r_x1": 286.362, "r_y1": 510.974, "r_x2": 286.362, "r_y2": 502.422, "r_x3": 260.35, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 522.929, "r_x1": 97.155, "r_y1": 522.929, "r_x2": 97.155, "r_y2": 514.377, "r_x3": 70.037, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "icantly", "orig": "icantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.678, "r_y0": 522.929, "r_x1": 150.375, "r_y1": 522.929, "r_x2": 150.375, "r_y2": 514.377, "r_x3": 101.678, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "outperforms", "orig": "outperforms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.898, "r_y0": 522.929, "r_x1": 186.301, "r_y1": 522.929, "r_x2": 186.301, "r_y2": 514.377, "r_x3": 154.898, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "existing", "orig": "existing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.824, "r_y0": 522.929, "r_x1": 250.021, "r_y1": 522.929, "r_x2": 250.021, "r_y2": 514.377, "r_x3": 190.824, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.544, "r_y0": 522.929, "r_x1": 286.365, "r_y1": 522.929, "r_x2": 286.365, "r_y2": 514.377, "r_x3": 254.544, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "metrics,", "orig": "metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 534.885, "r_x1": 286.365, "r_y1": 534.885, "r_x2": 286.365, "r_y2": 526.3330000000001, "r_x3": 70.037, "r_y3": 526.3330000000001, "coord_origin": "TOPLEFT"}, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 546.84, "r_x1": 161.653, "r_y1": 546.84, "r_x2": 161.653, "r_y2": 538.288, "r_x3": 70.037, "r_y3": 538.288, "coord_origin": "TOPLEFT"}, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 568.577, "r_x1": 116.712, "r_y1": 568.577, "r_x2": 116.712, "r_y2": 560.025, "r_x3": 70.037, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.583, "r_y0": 568.593, "r_x1": 177.682, "r_y1": 568.593, "r_x2": 177.682, "r_y2": 559.637, "r_x3": 121.583, "r_y3": 559.637, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.553, "r_y0": 568.577, "r_x1": 186.976, "r_y1": 568.577, "r_x2": 186.976, "r_y2": 560.025, "r_x3": 182.553, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.848, "r_y0": 568.577, "r_x1": 242.767, "r_y1": 568.577, "r_x2": 242.767, "r_y2": 560.025, "r_x3": 191.848, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "synthetically", "orig": "synthetically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.639, "r_y0": 568.577, "r_x1": 286.363, "r_y1": 568.577, "r_x2": 286.363, "r_y2": 560.025, "r_x3": 247.639, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "generated", "orig": "generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 580.532, "r_x1": 286.365, "r_y1": 580.532, "r_x2": 286.365, "r_y2": 571.98, "r_x3": 70.037, "r_y3": 571.98, "coord_origin": "TOPLEFT"}, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 592.487, "r_x1": 82.401, "r_y1": 592.487, "r_x2": 82.401, "r_y2": 583.935, "r_x3": 70.037, "r_y3": 583.935, "coord_origin": "TOPLEFT"}, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 614.2239999999999, "r_x1": 132.005, "r_y1": 614.2239999999999, "r_x2": 132.005, "r_y2": 605.672, "r_x3": 70.037, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "An augmented", "orig": "An augmented", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.082, "r_y0": 614.2239999999999, "r_x1": 165.748, "r_y1": 614.2239999999999, "r_x2": 165.748, "r_y2": 605.672, "r_x3": 138.082, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "dataset", "orig": "dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.815, "r_y0": 614.2239999999999, "r_x1": 194.5, "r_y1": 614.2239999999999, "r_x2": 194.5, "r_y2": 605.672, "r_x3": 171.815, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "based", "orig": "based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.577, "r_y0": 614.2239999999999, "r_x1": 210.54, "r_y1": 614.2239999999999, "r_x2": 210.54, "r_y2": 605.672, "r_x3": 200.577, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.617, "r_y0": 614.2239999999999, "r_x1": 261.2, "r_y1": 614.2239999999999, "r_x2": 261.2, "r_y2": 605.672, "r_x3": 216.617, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.277, "r_y0": 614.2239999999999, "r_x1": 286.365, "r_y1": 614.2239999999999, "r_x2": 286.365, "r_y2": 605.672, "r_x3": 267.277, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "[37],", "orig": "[37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 626.179, "r_x1": 135.521, "r_y1": 626.179, "r_x2": 135.521, "r_y2": 617.627, "r_x3": 70.037, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36],", "orig": "FinTabNet [36],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.925, "r_y0": 626.179, "r_x1": 286.365, "r_y1": 626.179, "r_x2": 286.365, "r_y2": 617.627, "r_x3": 139.925, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "and TableBank [17] with generated", "orig": "and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 638.135, "r_x1": 198.056, "r_y1": 638.135, "r_x2": 198.056, "r_y2": 629.583, "r_x3": 70.037, "r_y3": 629.583, "coord_origin": "TOPLEFT"}, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.789, "r_y0": 659.419, "r_x1": 286.365, "r_y1": 659.419, "r_x2": 286.365, "r_y2": 650.867, "r_x3": 210.789, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "In Sec. 2, we give", "orig": "In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 671.374, "r_x1": 240.896, "r_y1": 671.374, "r_x2": 240.896, "r_y2": 662.822, "r_x3": 50.112, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "a brief overview of the current state-of-the-art.", "orig": "a brief overview of the current state-of-the-art.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.833, "r_y0": 671.374, "r_x1": 286.365, "r_y1": 671.374, "r_x2": 286.365, "r_y2": 662.822, "r_x3": 246.833, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "In Sec. 3,", "orig": "In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 683.329, "r_x1": 227.396, "r_y1": 683.329, "r_x2": 227.396, "r_y2": 674.777, "r_x3": 50.112, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "we describe the datasets on which we train.", "orig": "we describe the datasets on which we train.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.467, "r_y0": 683.329, "r_x1": 286.365, "r_y1": 683.329, "r_x2": 286.365, "r_y2": 674.777, "r_x3": 232.467, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "In Sec. 4, we", "orig": "In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 695.284, "r_x1": 286.365, "r_y1": 695.284, "r_x2": 286.365, "r_y2": 686.732, "r_x3": 50.112, "r_y3": 686.732, "coord_origin": "TOPLEFT"}, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.458, "r_y0": 712.653, "r_x1": 183.731, "r_y1": 712.653, "r_x2": 183.731, "r_y2": 705.811, "r_x3": 64.458, "r_y3": 705.811, "coord_origin": "TOPLEFT"}, "text": "https://github.com/IBM/SynthTabNet", "orig": "https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 508.084, "r_y1": 107.93899999999996, "r_x2": 508.084, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 162.99699999999996, "r_x1": 545.115, "r_y1": 162.99699999999996, "r_x2": 545.115, "r_y2": 154.44500000000005, "r_x3": 308.862, "r_y3": 154.44500000000005, "coord_origin": "TOPLEFT"}, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 174.952, "r_x1": 334.376, "r_y1": 174.952, "r_x2": 334.376, "r_y2": 166.39999999999998, "r_x3": 308.862, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "tivates", "orig": "tivates", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.192, "r_y0": 174.952, "r_x1": 522.56, "r_y1": 174.952, "r_x2": 522.56, "r_y2": 166.39999999999998, "r_x3": 338.192, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "many organised public challenges [6, 4, 14].", "orig": "many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 174.952, "r_x1": 545.115, "r_y1": 174.952, "r_x2": 545.115, "r_y2": 166.39999999999998, "r_x3": 529.623, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 186.90700000000004, "r_x1": 545.115, "r_y1": 186.90700000000004, "r_x2": 545.115, "r_y2": 178.35500000000002, "r_x3": 308.862, "r_y3": 178.35500000000002, "coord_origin": "TOPLEFT"}, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 198.86199999999997, "r_x1": 545.115, "r_y1": 198.86199999999997, "r_x2": 545.115, "r_y2": 190.30999999999995, "r_x3": 308.862, "r_y3": 190.30999999999995, "coord_origin": "TOPLEFT"}, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 210.817, "r_x1": 346.979, "r_y1": 210.817, "r_x2": 346.979, "r_y2": 202.265, "r_x3": 308.862, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.869, "r_y0": 210.817, "r_x1": 508.642, "r_y1": 210.817, "r_x2": 508.642, "r_y2": 202.265, "r_x3": 354.869, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "Such large variety requires a flexible", "orig": "Such large variety requires a flexible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.737, "r_y0": 210.817, "r_x1": 545.115, "r_y1": 210.817, "r_x2": 545.115, "r_y2": 202.265, "r_x3": 512.737, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 222.77300000000002, "r_x1": 545.115, "r_y1": 222.77300000000002, "r_x2": 545.115, "r_y2": 214.221, "r_x3": 308.862, "r_y3": 214.221, "coord_origin": "TOPLEFT"}, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 234.72799999999995, "r_x1": 322.969, "r_y1": 234.72799999999995, "r_x2": 322.969, "r_y2": 226.17600000000004, "r_x3": 308.862, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "ers,", "orig": "ers,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.084, "r_y0": 234.72799999999995, "r_x1": 530.918, "r_y1": 234.72799999999995, "r_x2": 530.918, "r_y2": 226.17600000000004, "r_x3": 327.084, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "which can be extremely intricate and demanding.", "orig": "which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.922, "r_y0": 234.72799999999995, "r_x1": 545.115, "r_y1": 234.72799999999995, "r_x2": 545.115, "r_y2": 226.17600000000004, "r_x3": 537.922, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 246.683, "r_x1": 545.115, "r_y1": 246.683, "r_x2": 545.115, "r_y2": 238.13099999999997, "r_x3": 308.862, "r_y3": 238.13099999999997, "coord_origin": "TOPLEFT"}, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.63800000000003, "r_x1": 545.115, "r_y1": 258.63800000000003, "r_x2": 545.115, "r_y2": 250.086, "r_x3": 308.862, "r_y3": 250.086, "coord_origin": "TOPLEFT"}, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.59299999999996, "r_x1": 439.84, "r_y1": 270.59299999999996, "r_x2": 439.84, "r_y2": 262.04100000000005, "r_x3": 308.862, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.44, "r_y0": 270.429, "r_x1": 452.189, "r_y1": 270.429, "r_x2": 452.189, "r_y2": 261.72299999999996, "r_x3": 444.44, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.89, "r_y0": 270.429, "r_x1": 470.834, "r_y1": 270.429, "r_x2": 470.834, "r_y2": 261.72299999999996, "r_x3": 455.89, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 470.834, "r_y0": 270.59299999999996, "r_x1": 545.115, "r_y1": 270.59299999999996, "r_x2": 545.115, "r_y2": 262.04100000000005, "r_x3": 470.834, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.548, "r_x1": 545.115, "r_y1": 282.548, "r_x2": 545.115, "r_y2": 273.996, "r_x3": 308.862, "r_y3": 273.996, "coord_origin": "TOPLEFT"}, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.504, "r_x1": 545.115, "r_y1": 294.504, "r_x2": 545.115, "r_y2": 285.952, "r_x3": 308.862, "r_y3": 285.952, "coord_origin": "TOPLEFT"}, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 306.459, "r_x1": 545.115, "r_y1": 306.459, "r_x2": 545.115, "r_y2": 297.907, "r_x3": 308.862, "r_y3": 297.907, "coord_origin": "TOPLEFT"}, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.414, "r_x1": 545.115, "r_y1": 318.414, "r_x2": 545.115, "r_y2": 309.862, "r_x3": 308.862, "r_y3": 309.862, "coord_origin": "TOPLEFT"}, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.369, "r_x1": 425.923, "r_y1": 330.369, "r_x2": 425.923, "r_y2": 321.817, "r_x3": 308.862, "r_y3": 321.817, "coord_origin": "TOPLEFT"}, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.845, "r_y0": 342.39, "r_x1": 436.802, "r_y1": 342.39, "r_x2": 436.802, "r_y2": 333.838, "r_x3": 395.845, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "popularity", "orig": "popularity", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.145, "r_y0": 342.39, "r_x1": 449.444, "r_y1": 342.39, "r_x2": 449.444, "r_y2": 333.838, "r_x3": 441.145, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.798, "r_y0": 342.39, "r_x1": 545.115, "r_y1": 342.39, "r_x2": 545.115, "r_y2": 333.838, "r_x3": 453.798, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "deep neural networks,", "orig": "deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.345, "r_x1": 545.115, "r_y1": 354.345, "r_x2": 545.115, "r_y2": 345.793, "r_x3": 308.862, "r_y3": 345.793, "coord_origin": "TOPLEFT"}, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.3, "r_x1": 545.115, "r_y1": 366.3, "r_x2": 545.115, "r_y2": 357.748, "r_x3": 308.862, "r_y3": 357.748, "coord_origin": "TOPLEFT"}, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.256, "r_x1": 324.633, "r_y1": 378.256, "r_x2": 324.633, "r_y2": 369.704, "r_x3": 308.862, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "28].", "orig": "28].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.634, "r_y0": 378.256, "r_x1": 545.115, "r_y1": 378.256, "r_x2": 545.115, "r_y2": 369.704, "r_x3": 329.634, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "Although such methods work well on constrained ta-", "orig": "Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 390.211, "r_x1": 545.115, "r_y1": 390.211, "r_x2": 545.115, "r_y2": 381.659, "r_x3": 308.862, "r_y3": 381.659, "coord_origin": "TOPLEFT"}, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 402.166, "r_x1": 545.115, "r_y1": 402.166, "r_x2": 545.115, "r_y2": 393.614, "r_x3": 308.862, "r_y3": 393.614, "coord_origin": "TOPLEFT"}, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 414.121, "r_x1": 438.416, "r_y1": 414.121, "r_x2": 438.416, "r_y2": 405.569, "r_x3": 308.862, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "the availability of large datasets.", "orig": "the availability of large datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.231, "r_y0": 414.121, "r_x1": 545.115, "r_y1": 414.121, "r_x2": 545.115, "r_y2": 405.569, "r_x3": 442.231, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "To the best-of-our knowl-", "orig": "To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 426.076, "r_x1": 545.115, "r_y1": 426.076, "r_x2": 545.115, "r_y2": 417.524, "r_x3": 308.862, "r_y3": 417.524, "coord_origin": "TOPLEFT"}, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 438.032, "r_x1": 545.115, "r_y1": 438.032, "r_x2": 545.115, "r_y2": 429.48, "r_x3": 308.862, "r_y3": 429.48, "coord_origin": "TOPLEFT"}, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.987, "r_x1": 401.285, "r_y1": 449.987, "r_x2": 401.285, "r_y2": 441.435, "r_x3": 308.862, "r_y3": 441.435, "coord_origin": "TOPLEFT"}, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.267, "r_y0": 462.008, "r_x1": 426.037, "r_y1": 462.008, "r_x2": 426.037, "r_y2": 453.456, "r_x3": 423.267, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.769, "r_y0": 462.008, "r_x1": 545.11, "r_y1": 462.008, "r_x2": 545.11, "r_y2": 453.456, "r_x3": 430.769, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": "In this type of network, one", "orig": "In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.963, "r_x1": 340.404, "r_y1": 473.963, "r_x2": 340.404, "r_y2": 465.411, "r_x3": 308.862, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "predicts", "orig": "predicts", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.116, "r_y0": 473.963, "r_x1": 349.539, "r_y1": 473.963, "r_x2": 349.539, "r_y2": 465.411, "r_x3": 345.116, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.252, "r_y0": 473.963, "r_x1": 390.765, "r_y1": 473.963, "r_x2": 390.765, "r_y2": 465.411, "r_x3": 354.252, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.477, "r_y0": 473.963, "r_x1": 403.776, "r_y1": 473.963, "r_x2": 403.776, "r_y2": 465.411, "r_x3": 395.477, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.488, "r_y0": 473.963, "r_x1": 434.401, "r_y1": 473.963, "r_x2": 434.401, "r_y2": 465.411, "r_x3": 408.488, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.113, "r_y0": 473.963, "r_x1": 469.001, "r_y1": 473.963, "r_x2": 469.001, "r_y2": 465.411, "r_x3": 439.113, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "starting", "orig": "starting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.713, "r_y0": 473.963, "r_x1": 545.115, "r_y1": 473.963, "r_x2": 545.115, "r_y2": 465.411, "r_x3": 473.713, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "from an encoded", "orig": "from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.918, "r_x1": 335.701, "r_y1": 485.918, "r_x2": 335.701, "r_y2": 477.366, "r_x3": 308.862, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.853, "r_y0": 485.918, "r_x1": 411.009, "r_y1": 485.918, "r_x2": 411.009, "r_y2": 477.366, "r_x3": 345.853, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "Such sequences", "orig": "Such sequences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.85, "r_y0": 485.918, "r_x1": 424.149, "r_y1": 485.918, "r_x2": 424.149, "r_y2": 477.366, "r_x3": 415.85, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.001, "r_y0": 485.918, "r_x1": 454.914, "r_y1": 485.918, "r_x2": 454.914, "r_y2": 477.366, "r_x3": 429.001, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.756, "r_y0": 485.918, "r_x1": 473.584, "r_y1": 485.918, "r_x2": 473.584, "r_y2": 477.366, "r_x3": 459.756, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.425, "r_y0": 485.918, "r_x1": 487.83, "r_y1": 485.918, "r_x2": 487.83, "r_y2": 477.366, "r_x3": 478.425, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "be", "orig": "be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.682, "r_y0": 485.918, "r_x1": 545.115, "r_y1": 485.918, "r_x2": 545.115, "r_y2": 477.366, "r_x3": 492.682, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "HTML table", "orig": "HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.873, "r_x1": 459.218, "r_y1": 497.873, "r_x2": 459.218, "r_y2": 489.321, "r_x3": 308.862, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "tags [37, 17] or LaTeX symbols[10].", "orig": "tags [37, 17] or LaTeX symbols[10].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.115, "r_y0": 497.873, "r_x1": 545.115, "r_y1": 497.873, "r_x2": 545.115, "r_y2": 489.321, "r_x3": 465.115, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "The choice of sym-", "orig": "The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.828, "r_x1": 545.115, "r_y1": 509.828, "r_x2": 545.115, "r_y2": 501.276, "r_x3": 308.862, "r_y3": 501.276, "coord_origin": "TOPLEFT"}, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.784, "r_x1": 396.692, "r_y1": 521.784, "r_x2": 396.692, "r_y2": 513.232, "r_x3": 308.862, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "formed into the other.", "orig": "formed into the other.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.265, "r_y0": 521.784, "r_x1": 545.115, "r_y1": 521.784, "r_x2": 545.115, "r_y2": 513.232, "r_x3": 401.265, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "There are however subtle variations", "orig": "There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.739, "r_x1": 433.484, "r_y1": 533.739, "r_x2": 433.484, "r_y2": 525.187, "r_x3": 308.862, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "in the Image-to-Text networks.", "orig": "in the Image-to-Text networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.187, "r_y0": 533.739, "r_x1": 545.115, "r_y1": 533.739, "r_x2": 545.115, "r_y2": 525.187, "r_x3": 438.187, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "The easiest network archi-", "orig": "The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.694, "r_x1": 420.941, "r_y1": 545.694, "r_x2": 420.941, "r_y2": 537.142, "r_x3": 308.862, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "tectures are 'image-encoder", "orig": "tectures are 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.595, "r_y0": 545.388, "r_x1": 433.558, "r_y1": 545.388, "r_x2": 433.558, "r_y2": 536.8240000000001, "r_x3": 423.595, "r_y3": 536.8240000000001, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.212, "r_y0": 545.694, "r_x1": 545.113, "r_y1": 545.694, "r_x2": 545.113, "r_y2": 537.142, "r_x3": 436.212, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "text-decoder' (IETD), sim-", "orig": "text-decoder' (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.649, "r_x1": 545.115, "r_y1": 557.649, "r_x2": 545.115, "r_y2": 549.097, "r_x3": 308.862, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.604, "r_x1": 545.115, "r_y1": 569.604, "r_x2": 545.115, "r_y2": 561.052, "r_x3": 308.862, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.559, "r_x1": 503.671, "r_y1": 581.559, "r_x2": 503.671, "r_y2": 573.0070000000001, "r_x3": 308.862, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the LaTeX/HTML string of the entire table, i.e.", "orig": "the LaTeX/HTML string of the entire table, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 509.579, "r_y0": 581.559, "r_x1": 545.115, "r_y1": 581.559, "r_x2": 545.115, "r_y2": 573.0070000000001, "r_x3": 509.579, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the sym-", "orig": "the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.515, "r_x1": 545.115, "r_y1": 593.515, "r_x2": 545.115, "r_y2": 584.963, "r_x3": 308.862, "r_y3": 584.963, "coord_origin": "TOPLEFT"}, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.47, "r_x1": 330.72, "r_y1": 605.47, "r_x2": 330.72, "r_y2": 596.918, "r_x3": 308.862, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "table.", "orig": "table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.536, "r_y0": 605.47, "r_x1": 497.075, "r_y1": 605.47, "r_x2": 497.075, "r_y2": 596.918, "r_x3": 334.536, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Another approach is the 'image-encoder", "orig": "Another approach is the 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.805, "r_y0": 605.164, "r_x1": 509.768, "r_y1": 605.164, "r_x2": 509.768, "r_y2": 596.6, "r_x3": 499.805, "r_y3": 596.6, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.501, "r_y0": 605.47, "r_x1": 545.109, "r_y1": 605.47, "r_x2": 545.109, "r_y2": 596.918, "r_x3": 512.501, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.425, "r_x1": 545.115, "r_y1": 617.425, "r_x2": 545.115, "r_y2": 608.873, "r_x3": 308.862, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "coder' (IEDD) networks. In these type of networks, one has", "orig": "coder' (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.38, "r_x1": 545.115, "r_y1": 629.38, "r_x2": 545.115, "r_y2": 620.828, "r_x3": 308.862, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.335, "r_x1": 364.782, "r_y1": 641.335, "r_x2": 364.782, "r_y2": 632.783, "r_x3": 308.862, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.574, "r_y0": 641.192, "r_x1": 415.614, "r_y1": 641.192, "r_x2": 415.614, "r_y2": 632.604, "r_x3": 367.574, "r_y3": 632.604, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.613, "r_y0": 641.335, "r_x1": 418.104, "r_y1": 641.335, "r_x2": 418.104, "r_y2": 632.783, "r_x3": 415.613, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.963, "r_y0": 641.335, "r_x1": 433.137, "r_y1": 641.335, "r_x2": 433.137, "r_y2": 632.783, "r_x3": 420.963, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.122, "r_y0": 641.335, "r_x1": 442.661, "r_y1": 641.335, "r_x2": 442.661, "r_y2": 632.783, "r_x3": 437.122, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.441, "r_y0": 641.335, "r_x1": 545.117, "r_y1": 641.335, "r_x2": 545.117, "r_y2": 632.783, "r_x3": 445.441, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "only produces the HTM-", "orig": "only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.103, "r_x1": 373.599, "r_y1": 665.103, "r_x2": 373.599, "r_y2": 656.515, "r_x3": 308.862, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.907, "r_y0": 665.246, "r_x1": 545.116, "r_y1": 665.246, "r_x2": 545.116, "r_y2": 656.694, "r_x3": 376.907, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.013, "r_x1": 356.902, "r_y1": 689.013, "r_x2": 356.902, "r_y2": 680.425, "r_x3": 308.862, "r_y3": 680.425, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.131, "r_y0": 689.156, "r_x1": 360.449, "r_y1": 689.156, "r_x2": 360.449, "r_y2": 680.604, "r_x3": 357.131, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.045, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 364.045, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "to generate the textual content of each table", "orig": "to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 325.739, "r_y1": 701.111, "r_x2": 325.739, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.746, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 331.746, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "The network architecture of IEDD is certainly more", "orig": "The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 12, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9656890034675598, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9774322509765625, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 99.84000000000003, "r": 286.365, "b": 108.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9838606119155884, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 308.862, "t": 121.73199999999997, "r": 498.28, "b": 132.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9428724646568298, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 142.49, "r": 545.115, "b": 151.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.987194836139679, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 231.79999999999995, "r": 286.365, "b": 240.35199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9855920076370239, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 333.838, "r": 391.492, "b": 342.39, "coord_origin": "TOPLEFT"}, "confidence": 0.9869040250778198, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 62.067, "t": 375.715, "r": 286.365, "b": 384.267, "coord_origin": "TOPLEFT"}, "confidence": 0.9820111393928528, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 61.569, "t": 444.82, "r": 65.056, "b": 453.372, "coord_origin": "TOPLEFT"}, "confidence": 0.9822162389755249, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 453.068, "r": 423.262, "b": 462.024, "coord_origin": "TOPLEFT"}, "confidence": 0.9843218326568604, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 61.569, "t": 502.422, "r": 65.056, "b": 510.974, "coord_origin": "TOPLEFT"}, "confidence": 0.982271671295166, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 61.569, "t": 560.025, "r": 65.056, "b": 568.577, "coord_origin": "TOPLEFT"}, "confidence": 0.9802963733673096, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 61.569, "t": 605.672, "r": 65.056, "b": 614.2239999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9806395173072815, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 650.867, "r": 204.452, "b": 659.419, "coord_origin": "TOPLEFT"}, "confidence": 0.9742533564567566, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "footnote", "bbox": {"l": 60.971, "t": 704.296, "r": 63.96, "b": 709.427, "coord_origin": "TOPLEFT"}, "confidence": 0.895367443561554, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8778094053268433, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 12, "page_no": 1, "cluster": {"id": 12, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9656890034675598, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "considered as a solved problem, given enough ground-truth"}, {"label": "text", "id": 10, "page_no": 1, "cluster": {"id": 10, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9774322509765625, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "its results & performance in Sec. 5. As a conclusion, we de-"}, {"label": "text", "id": 4, "page_no": 1, "cluster": {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 99.84000000000003, "r": 286.365, "b": 108.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9838606119155884, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The second problem is called table-structure decompo-"}, {"label": "section_header", "id": 13, "page_no": 1, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 308.862, "t": 121.73199999999997, "r": 498.28, "b": 132.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9428724646568298, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Previous work and State of the Art"}, {"label": "text", "id": 0, "page_no": 1, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 142.49, "r": 545.115, "b": 151.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.987194836139679, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Identifying the structure of a table has been an outstand-"}, {"label": "text", "id": 2, "page_no": 1, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 231.79999999999995, "r": 286.365, "b": 240.35199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9855920076370239, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we want to address these weaknesses and"}, {"label": "text", "id": 1, "page_no": 1, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 333.838, "r": 391.492, "b": 342.39, "coord_origin": "TOPLEFT"}, "confidence": 0.9869040250778198, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Before the rising"}, {"label": "text", "id": 7, "page_no": 1, "cluster": {"id": 7, "label": "text", "bbox": {"l": 62.067, "t": 375.715, "r": 286.365, "b": 384.267, "coord_origin": "TOPLEFT"}, "confidence": 0.9820111393928528, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To meet the design criteria listed above, we developed a"}, {"label": "list_item", "id": 6, "page_no": 1, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 61.569, "t": 444.82, "r": 65.056, "b": 453.372, "coord_origin": "TOPLEFT"}, "confidence": 0.9822162389755249, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "text", "id": 3, "page_no": 1, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 453.068, "r": 423.262, "b": 462.024, "coord_origin": "TOPLEFT"}, "confidence": 0.9843218326568604, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image-to-Text networks"}, {"label": "list_item", "id": 5, "page_no": 1, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 61.569, "t": 502.422, "r": 65.056, "b": 510.974, "coord_origin": "TOPLEFT"}, "confidence": 0.982271671295166, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "list_item", "id": 9, "page_no": 1, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 61.569, "t": 560.025, "r": 65.056, "b": 568.577, "coord_origin": "TOPLEFT"}, "confidence": 0.9802963733673096, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "list_item", "id": 8, "page_no": 1, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 61.569, "t": 605.672, "r": 65.056, "b": 614.2239999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9806395173072815, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "text", "id": 11, "page_no": 1, "cluster": {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 650.867, "r": 204.452, "b": 659.419, "coord_origin": "TOPLEFT"}, "confidence": 0.9742533564567566, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The paper is structured as follows."}, {"label": "footnote", "id": 14, "page_no": 1, "cluster": {"id": 14, "label": "footnote", "bbox": {"l": 60.971, "t": 704.296, "r": 63.96, "b": 709.427, "coord_origin": "TOPLEFT"}, "confidence": 0.895367443561554, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1"}, {"label": "page_footer", "id": 15, "page_no": 1, "cluster": {"id": 15, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8778094053268433, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2"}], "body": [{"label": "text", "id": 12, "page_no": 1, "cluster": {"id": 12, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9656890034675598, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "considered as a solved problem, given enough ground-truth"}, {"label": "text", "id": 10, "page_no": 1, "cluster": {"id": 10, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9774322509765625, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "its results & performance in Sec. 5. As a conclusion, we de-"}, {"label": "text", "id": 4, "page_no": 1, "cluster": {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 99.84000000000003, "r": 286.365, "b": 108.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9838606119155884, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The second problem is called table-structure decompo-"}, {"label": "section_header", "id": 13, "page_no": 1, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 308.862, "t": 121.73199999999997, "r": 498.28, "b": 132.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9428724646568298, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Previous work and State of the Art"}, {"label": "text", "id": 0, "page_no": 1, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 142.49, "r": 545.115, "b": 151.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.987194836139679, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Identifying the structure of a table has been an outstand-"}, {"label": "text", "id": 2, "page_no": 1, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 231.79999999999995, "r": 286.365, "b": 240.35199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9855920076370239, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we want to address these weaknesses and"}, {"label": "text", "id": 1, "page_no": 1, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 333.838, "r": 391.492, "b": 342.39, "coord_origin": "TOPLEFT"}, "confidence": 0.9869040250778198, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Before the rising"}, {"label": "text", "id": 7, "page_no": 1, "cluster": {"id": 7, "label": "text", "bbox": {"l": 62.067, "t": 375.715, "r": 286.365, "b": 384.267, "coord_origin": "TOPLEFT"}, "confidence": 0.9820111393928528, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To meet the design criteria listed above, we developed a"}, {"label": "list_item", "id": 6, "page_no": 1, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 61.569, "t": 444.82, "r": 65.056, "b": 453.372, "coord_origin": "TOPLEFT"}, "confidence": 0.9822162389755249, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "text", "id": 3, "page_no": 1, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 453.068, "r": 423.262, "b": 462.024, "coord_origin": "TOPLEFT"}, "confidence": 0.9843218326568604, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image-to-Text networks"}, {"label": "list_item", "id": 5, "page_no": 1, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 61.569, "t": 502.422, "r": 65.056, "b": 510.974, "coord_origin": "TOPLEFT"}, "confidence": 0.982271671295166, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "list_item", "id": 9, "page_no": 1, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 61.569, "t": 560.025, "r": 65.056, "b": 568.577, "coord_origin": "TOPLEFT"}, "confidence": 0.9802963733673096, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "list_item", "id": 8, "page_no": 1, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 61.569, "t": 605.672, "r": 65.056, "b": 614.2239999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9806395173072815, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "text", "id": 11, "page_no": 1, "cluster": {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 650.867, "r": 204.452, "b": 659.419, "coord_origin": "TOPLEFT"}, "confidence": 0.9742533564567566, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The paper is structured as follows."}, {"label": "footnote", "id": 14, "page_no": 1, "cluster": {"id": 14, "label": "footnote", "bbox": {"l": 60.971, "t": 704.296, "r": 63.96, "b": 709.427, "coord_origin": "TOPLEFT"}, "confidence": 0.895367443561554, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1"}], "headers": [{"label": "page_footer", "id": 15, "page_no": 1, "cluster": {"id": 15, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8778094053268433, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2"}]}}, {"page_no": 2, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.931, "r_y0": 96.03999999999996, "r_x1": 110.953, "r_y1": 96.03999999999996, "r_x2": 110.953, "r_y2": 87.48800000000006, "r_x3": 76.931, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.545, "r_y0": 96.03999999999996, "r_x1": 136.258, "r_y1": 96.03999999999996, "r_x2": 136.258, "r_y2": 87.48800000000006, "r_x3": 118.545, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.824, "r_y0": 96.03999999999996, "r_x1": 175.372, "r_y1": 96.03999999999996, "r_x2": 175.372, "r_y2": 87.48800000000006, "r_x3": 142.824, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 96.03999999999996, "r_x1": 232.836, "r_y1": 96.03999999999996, "r_x2": 232.836, "r_y2": 87.48800000000006, "r_x3": 181.947, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.411, "r_y0": 96.03999999999996, "r_x1": 265.414, "r_y1": 96.03999999999996, "r_x2": 265.414, "r_y2": 87.48800000000006, "r_x3": 239.411, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.979, "r_y0": 96.03999999999996, "r_x1": 286.365, "r_y1": 96.03999999999996, "r_x2": 286.365, "r_y2": 87.48800000000006, "r_x3": 271.979, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.995, "r_x1": 286.365, "r_y1": 107.995, "r_x2": 286.365, "r_y2": 99.44299999999998, "r_x3": 50.112, "r_y3": 99.44299999999998, "coord_origin": "TOPLEFT"}, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.95100000000002, "r_x1": 286.365, "r_y1": 119.95100000000002, "r_x2": 286.365, "r_y2": 111.399, "r_x3": 50.112, "r_y3": 111.399, "coord_origin": "TOPLEFT"}, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.90599999999995, "r_x1": 286.365, "r_y1": 131.90599999999995, "r_x2": 286.365, "r_y2": 123.35400000000004, "r_x3": 50.112, "r_y3": 123.35400000000004, "coord_origin": "TOPLEFT"}, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.861, "r_x1": 286.365, "r_y1": 143.861, "r_x2": 286.365, "r_y2": 135.30899999999997, "r_x3": 50.112, "r_y3": 135.30899999999997, "coord_origin": "TOPLEFT"}, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.81600000000003, "r_x1": 174.206, "r_y1": 155.81600000000003, "r_x2": 174.206, "r_y2": 147.264, "r_x3": 50.112, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "bedded in the content-decoder.", "orig": "bedded in the content-decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.098, "r_y0": 155.81600000000003, "r_x1": 286.365, "r_y1": 155.81600000000003, "r_x2": 286.365, "r_y2": 147.264, "r_x3": 179.098, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "This reliance on a custom,", "orig": "This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 167.77099999999996, "r_x1": 243.267, "r_y1": 167.77099999999996, "r_x2": 243.267, "r_y2": 159.21900000000005, "r_x3": 50.112, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "implicit OCR decoder is of course problematic.", "orig": "implicit OCR decoder is of course problematic.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.437, "r_y0": 167.77099999999996, "r_x1": 286.365, "r_y1": 167.77099999999996, "r_x2": 286.365, "r_y2": 159.21900000000005, "r_x3": 248.437, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "OCR is a", "orig": "OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 179.726, "r_x1": 286.365, "r_y1": 179.726, "r_x2": 286.365, "r_y2": 171.17399999999998, "r_x3": 50.112, "r_y3": 171.17399999999998, "coord_origin": "TOPLEFT"}, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 191.68200000000002, "r_x1": 286.365, "r_y1": 191.68200000000002, "r_x2": 286.365, "r_y2": 183.13, "r_x3": 50.112, "r_y3": 183.13, "coord_origin": "TOPLEFT"}, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 203.63699999999994, "r_x1": 126.655, "r_y1": 203.63699999999994, "r_x2": 126.655, "r_y2": 195.08500000000004, "r_x3": 50.112, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "limited availability", "orig": "limited availability", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.59, "r_y0": 203.63699999999994, "r_x1": 142.206, "r_y1": 203.63699999999994, "r_x2": 142.206, "r_y2": 195.08500000000004, "r_x3": 130.59, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.132, "r_y0": 203.63699999999994, "r_x1": 286.365, "r_y1": 203.63699999999994, "r_x2": 286.365, "r_y2": 195.08500000000004, "r_x3": 146.132, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "non-english content in the current", "orig": "non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.59199999999998, "r_x1": 286.365, "r_y1": 215.59199999999998, "r_x2": 286.365, "r_y2": 207.03999999999996, "r_x3": 50.112, "r_y3": 207.03999999999996, "coord_origin": "TOPLEFT"}, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.54700000000003, "r_x1": 286.365, "r_y1": 227.54700000000003, "r_x2": 286.365, "r_y2": 218.995, "r_x3": 50.112, "r_y3": 218.995, "coord_origin": "TOPLEFT"}, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 239.50199999999995, "r_x1": 286.365, "r_y1": 239.50199999999995, "r_x2": 286.365, "r_y2": 230.95000000000005, "r_x3": 50.112, "r_y3": 230.95000000000005, "coord_origin": "TOPLEFT"}, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 251.457, "r_x1": 286.365, "r_y1": 251.457, "r_x2": 286.365, "r_y2": 242.90499999999997, "r_x3": 50.112, "r_y3": 242.90499999999997, "coord_origin": "TOPLEFT"}, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 263.413, "r_x1": 66.989, "r_y1": 263.413, "r_x2": 66.989, "r_y2": 254.861, "r_x3": 50.112, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.382, "r_y0": 263.413, "r_x1": 286.365, "r_y1": 263.413, "r_x2": 286.365, "r_y2": 254.861, "r_x3": 71.382, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "The latter was the inspiration for the work of this pa-", "orig": "The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 275.36800000000005, "r_x1": 64.777, "r_y1": 275.36800000000005, "r_x2": 64.777, "r_y2": 266.81600000000003, "r_x3": 50.112, "r_y3": 266.81600000000003, "coord_origin": "TOPLEFT"}, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.677, "r_y0": 287.395, "r_x1": 126.007, "r_y1": 287.395, "r_x2": 126.007, "r_y2": 278.43899999999996, "r_x3": 96.677, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.373, "r_y0": 287.395, "r_x1": 171.566, "r_y1": 287.395, "r_x2": 171.566, "r_y2": 278.43899999999996, "r_x3": 132.373, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.568, "r_y0": 287.379, "r_x1": 174.338, "r_y1": 287.379, "r_x2": 174.338, "r_y2": 278.827, "r_x3": 171.568, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.187, "r_y0": 287.379, "r_x1": 210.083, "r_y1": 287.379, "r_x2": 210.083, "r_y2": 278.827, "r_x3": 185.187, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.459, "r_y0": 287.379, "r_x1": 243.568, "r_y1": 287.379, "r_x2": 243.568, "r_y2": 278.827, "r_x3": 216.459, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.944, "r_y0": 287.379, "r_x1": 286.357, "r_y1": 287.379, "r_x2": 286.357, "r_y2": 278.827, "r_x3": 249.944, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.335, "r_x1": 84.971, "r_y1": 299.335, "r_x2": 84.971, "r_y2": 290.783, "r_x3": 50.112, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "(GNN's)", "orig": "(GNN's)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.347, "r_y0": 299.335, "r_x1": 107.845, "r_y1": 299.335, "r_x2": 107.845, "r_y2": 290.783, "r_x3": 91.347, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "take", "orig": "take", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.211, "r_y0": 299.335, "r_x1": 118.635, "r_y1": 299.335, "r_x2": 118.635, "r_y2": 290.783, "r_x3": 114.211, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.011, "r_y0": 299.335, "r_x1": 159.87, "r_y1": 299.335, "r_x2": 159.87, "r_y2": 290.783, "r_x3": 125.011, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "radically", "orig": "radically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.246, "r_y0": 299.335, "r_x1": 200.298, "r_y1": 299.335, "r_x2": 200.298, "r_y2": 290.783, "r_x3": 166.246, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.664, "r_y0": 299.335, "r_x1": 243.177, "r_y1": 299.335, "r_x2": 243.177, "r_y2": 290.783, "r_x3": 206.664, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "approach", "orig": "approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.553, "r_y0": 299.335, "r_x1": 257.304, "r_y1": 299.335, "r_x2": 257.304, "r_y2": 290.783, "r_x3": 249.553, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.68, "r_y0": 299.335, "r_x1": 286.365, "r_y1": 299.335, "r_x2": 286.365, "r_y2": 290.783, "r_x3": 263.68, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "table-", "orig": "table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.29, "r_x1": 84.971, "r_y1": 311.29, "r_x2": 84.971, "r_y2": 302.738, "r_x3": 50.112, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.986, "r_y0": 311.29, "r_x1": 131.168, "r_y1": 311.29, "r_x2": 131.168, "r_y2": 302.738, "r_x3": 88.986, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "extraction.", "orig": "extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.849, "r_y0": 311.29, "r_x1": 286.365, "r_y1": 311.29, "r_x2": 286.365, "r_y2": 302.738, "r_x3": 138.849, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.245, "r_x1": 286.365, "r_y1": 323.245, "r_x2": 286.365, "r_y2": 314.693, "r_x3": 50.112, "r_y3": 314.693, "coord_origin": "TOPLEFT"}, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.2, "r_x1": 136.996, "r_y1": 335.2, "r_x2": 136.996, "r_y2": 326.648, "r_x3": 50.112, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "one creates an initial", "orig": "one creates an initial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.051, "r_y0": 335.2, "r_x1": 166.226, "r_y1": 335.2, "r_x2": 166.226, "r_y2": 326.648, "r_x3": 141.051, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "graph,", "orig": "graph,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.679, "r_y0": 335.2, "r_x1": 286.365, "r_y1": 335.2, "r_x2": 286.365, "r_y2": 326.648, "r_x3": 170.679, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "where each of the text-cells", "orig": "where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.155, "r_x1": 260.442, "r_y1": 347.155, "r_x2": 260.442, "r_y2": 338.603, "r_x3": 50.112, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "becomes a node in the graph similar to [33, 34, 2].", "orig": "becomes a node in the graph similar to [33, 34, 2].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.45, "r_y0": 347.155, "r_x1": 286.365, "r_y1": 347.155, "r_x2": 286.365, "r_y2": 338.603, "r_x3": 266.45, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "Each", "orig": "Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.11, "r_x1": 286.365, "r_y1": 359.11, "r_x2": 286.365, "r_y2": 350.558, "r_x3": 50.112, "r_y3": 350.558, "coord_origin": "TOPLEFT"}, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.066, "r_x1": 286.365, "r_y1": 371.066, "r_x2": 286.365, "r_y2": 362.514, "r_x3": 50.112, "r_y3": 362.514, "coord_origin": "TOPLEFT"}, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.021, "r_x1": 67.397, "r_y1": 383.021, "r_x2": 67.397, "r_y2": 374.469, "r_x3": 50.112, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "text.", "orig": "text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 72.976, "r_y0": 383.021, "r_x1": 286.365, "r_y1": 383.021, "r_x2": 286.365, "r_y2": 374.469, "r_x3": 72.976, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "Furthermore, nodes that represent adjacent text-cells", "orig": "Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 394.976, "r_x1": 92.602, "r_y1": 394.976, "r_x2": 92.602, "r_y2": 386.424, "r_x3": 50.112, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "are linked.", "orig": "are linked.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.305, "r_y0": 394.976, "r_x1": 286.365, "r_y1": 394.976, "r_x2": 286.365, "r_y2": 386.424, "r_x3": 97.305, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "Graph Convolutional Networks (GCN's) based", "orig": "Graph Convolutional Networks (GCN's) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 406.931, "r_x1": 286.365, "r_y1": 406.931, "r_x2": 286.365, "r_y2": 398.379, "r_x3": 50.112, "r_y3": 398.379, "coord_origin": "TOPLEFT"}, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 418.886, "r_x1": 286.365, "r_y1": 418.886, "r_x2": 286.365, "r_y2": 410.334, "r_x3": 50.112, "r_y3": 410.334, "coord_origin": "TOPLEFT"}, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 430.841, "r_x1": 286.365, "r_y1": 430.841, "r_x2": 286.365, "r_y2": 422.289, "r_x3": 50.112, "r_y3": 422.289, "coord_origin": "TOPLEFT"}, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 442.797, "r_x1": 198.236, "r_y1": 442.797, "r_x2": 198.236, "r_y2": 434.245, "r_x3": 50.112, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.927, "r_y0": 442.797, "r_x1": 286.365, "r_y1": 442.797, "r_x2": 286.365, "r_y2": 434.245, "r_x3": 205.927, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 454.752, "r_x1": 165.618, "r_y1": 454.752, "r_x2": 165.618, "r_y2": 446.2, "r_x3": 50.112, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "represent the table-structure.", "orig": "represent the table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.417, "r_y0": 454.752, "r_x1": 286.365, "r_y1": 454.752, "r_x2": 286.365, "r_y2": 446.2, "r_x3": 171.417, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "With this approach, one can", "orig": "With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 466.707, "r_x1": 242.36, "r_y1": 466.707, "r_x2": 242.36, "r_y2": 458.155, "r_x3": 50.112, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "avoid the need to build custom OCR decoders.", "orig": "avoid the need to build custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.408, "r_y0": 466.707, "r_x1": 286.365, "r_y1": 466.707, "r_x2": 286.365, "r_y2": 458.155, "r_x3": 248.408, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "However,", "orig": "However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 478.662, "r_x1": 286.365, "r_y1": 478.662, "r_x2": 286.365, "r_y2": 470.11, "r_x3": 50.112, "r_y3": 470.11, "coord_origin": "TOPLEFT"}, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 490.617, "r_x1": 186.5, "r_y1": 490.617, "r_x2": 186.5, "r_y2": 482.065, "r_x3": 50.112, "r_y3": 482.065, "coord_origin": "TOPLEFT"}, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.882, "r_y0": 502.629, "r_x1": 255.652, "r_y1": 502.629, "r_x2": 255.652, "r_y2": 494.077, "r_x3": 252.882, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.63, "r_y0": 502.629, "r_x1": 286.366, "r_y1": 502.629, "r_x2": 286.366, "r_y2": 494.077, "r_x3": 258.63, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": "Apop-", "orig": "Apop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.5840000000001, "r_x1": 286.365, "r_y1": 514.5840000000001, "r_x2": 286.365, "r_y2": 506.032, "r_x3": 50.112, "r_y3": 506.032, "coord_origin": "TOPLEFT"}, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 526.539, "r_x1": 286.365, "r_y1": 526.539, "r_x2": 286.365, "r_y2": 517.9870000000001, "r_x3": 50.112, "r_y3": 517.9870000000001, "coord_origin": "TOPLEFT"}, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 538.494, "r_x1": 286.365, "r_y1": 538.494, "r_x2": 286.365, "r_y2": 529.942, "r_x3": 50.112, "r_y3": 529.942, "coord_origin": "TOPLEFT"}, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.45, "r_x1": 286.365, "r_y1": 550.45, "r_x2": 286.365, "r_y2": 541.898, "r_x3": 50.112, "r_y3": 541.898, "coord_origin": "TOPLEFT"}, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 562.405, "r_x1": 286.365, "r_y1": 562.405, "r_x2": 286.365, "r_y2": 553.8530000000001, "r_x3": 50.112, "r_y3": 553.8530000000001, "coord_origin": "TOPLEFT"}, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 574.36, "r_x1": 59.527, "r_y1": 574.36, "r_x2": 59.527, "r_y2": 565.808, "r_x3": 50.112, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "its", "orig": "its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.259, "r_y0": 574.36, "r_x1": 95.8, "r_y1": 574.36, "r_x2": 95.8, "r_y2": 565.808, "r_x3": 64.259, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "images)", "orig": "images)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.523, "r_y0": 574.36, "r_x1": 145.105, "r_y1": 574.36, "r_x2": 145.105, "r_y2": 565.808, "r_x3": 100.523, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "and finally", "orig": "and finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.828, "r_y0": 574.36, "r_x1": 166.983, "r_y1": 574.36, "r_x2": 166.983, "r_y2": 565.808, "r_x3": 149.828, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "uses", "orig": "uses", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.715, "r_y0": 574.36, "r_x1": 205.768, "r_y1": 574.36, "r_x2": 205.768, "r_y2": 565.808, "r_x3": 171.715, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.5, "r_y0": 574.36, "r_x1": 244.243, "r_y1": 574.36, "r_x2": 244.243, "r_y2": 565.808, "r_x3": 210.5, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "rule-sets", "orig": "rule-sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.975, "r_y0": 574.36, "r_x1": 256.726, "r_y1": 574.36, "r_x2": 256.726, "r_y2": 565.808, "r_x3": 248.975, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.459, "r_y0": 574.36, "r_x1": 286.365, "r_y1": 574.36, "r_x2": 286.365, "r_y2": 565.808, "r_x3": 261.459, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "obtain", "orig": "obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.315, "r_x1": 122.64, "r_y1": 586.315, "r_x2": 122.64, "r_y2": 577.763, "r_x3": 50.112, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "its table-structure.", "orig": "its table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.482, "r_y0": 586.315, "r_x1": 286.365, "r_y1": 586.315, "r_x2": 286.365, "r_y2": 577.763, "r_x3": 127.482, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "Currently, this approach achieves state-", "orig": "Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 598.27, "r_x1": 87.731, "r_y1": 598.27, "r_x2": 87.731, "r_y2": 589.718, "r_x3": 50.112, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "of-the-art", "orig": "of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.074, "r_y0": 598.27, "r_x1": 120.577, "r_y1": 598.27, "r_x2": 120.577, "r_y2": 589.718, "r_x3": 92.074, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "results,", "orig": "results,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.389, "r_y0": 598.27, "r_x1": 137.922, "r_y1": 598.27, "r_x2": 137.922, "r_y2": 589.718, "r_x3": 125.389, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "but", "orig": "but", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.266, "r_y0": 598.27, "r_x1": 148.911, "r_y1": 598.27, "r_x2": 148.911, "r_y2": 589.718, "r_x3": 142.266, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.255, "r_y0": 598.27, "r_x1": 165.987, "r_y1": 598.27, "r_x2": 165.987, "r_y2": 589.718, "r_x3": 153.255, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "not", "orig": "not", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.331, "r_y0": 598.27, "r_x1": 286.365, "r_y1": 598.27, "r_x2": 286.365, "r_y2": 589.718, "r_x3": 170.331, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "an end-to-end deep-learning", "orig": "an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 610.225, "r_x1": 82.49, "r_y1": 610.225, "r_x2": 82.49, "r_y2": 601.673, "r_x3": 50.112, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.173, "r_y0": 610.225, "r_x1": 286.365, "r_y1": 610.225, "r_x2": 286.365, "r_y2": 601.673, "r_x3": 87.173, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "As such, new rules need to be written if different", "orig": "As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 622.181, "r_x1": 175.989, "r_y1": 622.181, "r_x2": 175.989, "r_y2": 613.629, "r_x3": 50.112, "r_y3": 613.629, "coord_origin": "TOPLEFT"}, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 133.479, "r_y1": 689.156, "r_x2": 133.479, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "evaluate our models.", "orig": "evaluate our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.271, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 138.271, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "These datasets span over various ap-", "orig": "These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 166.246, "r_y1": 701.111, "r_x2": 166.246, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.688, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 173.688, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.491, "r_y0": 276.65700000000004, "r_x1": 545.115, "r_y1": 276.65700000000004, "r_x2": 545.115, "r_y2": 268.105, "r_x3": 354.491, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 288.612, "r_x1": 498.57, "r_y1": 288.612, "r_x2": 498.57, "r_y2": 280.06, "r_x3": 308.862, "r_y3": 280.06, "coord_origin": "TOPLEFT"}, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 352.307, "r_x1": 545.115, "r_y1": 352.307, "r_x2": 545.115, "r_y2": 343.755, "r_x3": 308.862, "r_y3": 343.755, "coord_origin": "TOPLEFT"}, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 364.263, "r_x1": 545.115, "r_y1": 364.263, "r_x2": 545.115, "r_y2": 355.711, "r_x3": 308.862, "r_y3": 355.711, "coord_origin": "TOPLEFT"}, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.218, "r_x1": 545.115, "r_y1": 376.218, "r_x2": 545.115, "r_y2": 367.666, "r_x3": 308.862, "r_y3": 367.666, "coord_origin": "TOPLEFT"}, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.173, "r_x1": 545.115, "r_y1": 388.173, "r_x2": 545.115, "r_y2": 379.621, "r_x3": 308.862, "r_y3": 379.621, "coord_origin": "TOPLEFT"}, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.128, "r_x1": 545.115, "r_y1": 400.128, "r_x2": 545.115, "r_y2": 391.576, "r_x3": 308.862, "r_y3": 391.576, "coord_origin": "TOPLEFT"}, "text": "a table is characterized as 'simple' when it does not contain", "orig": "a table is characterized as 'simple' when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.083, "r_x1": 545.115, "r_y1": 412.083, "r_x2": 545.115, "r_y2": 403.531, "r_x3": 308.862, "r_y3": 403.531, "coord_origin": "TOPLEFT"}, "text": "row spans or column spans, otherwise it is 'complex'. The", "orig": "row spans or column spans, otherwise it is 'complex'. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.038, "r_x1": 545.115, "r_y1": 424.038, "r_x2": 545.115, "r_y2": 415.486, "r_x3": 308.862, "r_y3": 415.486, "coord_origin": "TOPLEFT"}, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.994, "r_x1": 545.115, "r_y1": 435.994, "r_x2": 545.115, "r_y2": 427.442, "r_x3": 308.862, "r_y3": 427.442, "coord_origin": "TOPLEFT"}, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.949, "r_x1": 545.115, "r_y1": 447.949, "r_x2": 545.115, "r_y2": 439.397, "r_x3": 308.862, "r_y3": 439.397, "coord_origin": "TOPLEFT"}, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.904, "r_x1": 545.115, "r_y1": 459.904, "r_x2": 545.115, "r_y2": 451.352, "r_x3": 308.862, "r_y3": 451.352, "coord_origin": "TOPLEFT"}, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 471.859, "r_x1": 545.115, "r_y1": 471.859, "r_x2": 545.115, "r_y2": 463.307, "r_x3": 308.862, "r_y3": 463.307, "coord_origin": "TOPLEFT"}, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 483.814, "r_x1": 358.984, "r_y1": 483.814, "r_x2": 358.984, "r_y2": 475.262, "r_x3": 308.862, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "text content.", "orig": "text content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.121, "r_y0": 483.814, "r_x1": 545.115, "r_y1": 483.814, "r_x2": 545.115, "r_y2": 475.262, "r_x3": 365.121, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "Similarly to the PubTabNet, the annotations", "orig": "Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 495.77, "r_x1": 545.115, "r_y1": 495.77, "r_x2": 545.115, "r_y2": 487.218, "r_x3": 308.862, "r_y3": 487.218, "coord_origin": "TOPLEFT"}, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 507.725, "r_x1": 545.115, "r_y1": 507.725, "r_x2": 545.115, "r_y2": 499.173, "r_x3": 308.862, "r_y3": 499.173, "coord_origin": "TOPLEFT"}, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 519.6800000000001, "r_x1": 545.115, "r_y1": 519.6800000000001, "r_x2": 545.115, "r_y2": 511.128, "r_x3": 308.862, "r_y3": 511.128, "coord_origin": "TOPLEFT"}, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.635, "r_x1": 545.115, "r_y1": 531.635, "r_x2": 545.115, "r_y2": 523.0830000000001, "r_x3": 308.862, "r_y3": 523.0830000000001, "coord_origin": "TOPLEFT"}, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.59, "r_x1": 545.115, "r_y1": 543.59, "r_x2": 545.115, "r_y2": 535.038, "r_x3": 308.862, "r_y3": 535.038, "coord_origin": "TOPLEFT"}, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.545, "r_x1": 350.964, "r_y1": 555.545, "r_x2": 350.964, "r_y2": 546.9929999999999, "r_x3": 308.862, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "plex, Test:", "orig": "plex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.467, "r_y0": 555.545, "r_x1": 490.082, "r_y1": 555.545, "r_x2": 490.082, "r_y2": 546.9929999999999, "r_x3": 355.467, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "48% simple, 52% complex, Test:", "orig": "48% simple, 52% complex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.595, "r_y0": 555.545, "r_x1": 545.115, "r_y1": 555.545, "r_x2": 545.115, "r_y2": 546.9929999999999, "r_x3": 494.595, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "53% simple,", "orig": "53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.501, "r_x1": 370.6, "r_y1": 567.501, "r_x2": 370.6, "r_y2": 558.9490000000001, "r_x3": 308.862, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "47% complex).", "orig": "47% complex).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.737, "r_y0": 567.501, "r_x1": 545.115, "r_y1": 567.501, "r_x2": 545.115, "r_y2": 558.9490000000001, "r_x3": 376.737, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "Finally the TableBank dataset consists of", "orig": "Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 579.456, "r_x1": 545.115, "r_y1": 579.456, "r_x2": 545.115, "r_y2": 570.904, "r_x3": 308.862, "r_y3": 570.904, "coord_origin": "TOPLEFT"}, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 591.4110000000001, "r_x1": 545.115, "r_y1": 591.4110000000001, "r_x2": 545.115, "r_y2": 582.859, "r_x3": 308.862, "r_y3": 582.859, "coord_origin": "TOPLEFT"}, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 603.366, "r_x1": 403.726, "r_y1": 603.366, "r_x2": 403.726, "r_y2": 594.814, "r_x3": 308.862, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "boxes of the table cells.", "orig": "boxes of the table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.731, "r_y0": 603.366, "r_x1": 545.115, "r_y1": 603.366, "r_x2": 545.115, "r_y2": 594.814, "r_x3": 407.731, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "The entire dataset consists of sim-", "orig": "The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 615.321, "r_x1": 545.115, "r_y1": 615.321, "r_x2": 545.115, "r_y2": 606.769, "r_x3": 308.862, "r_y3": 606.769, "coord_origin": "TOPLEFT"}, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 627.2760000000001, "r_x1": 348.164, "r_y1": 627.2760000000001, "r_x2": 348.164, "r_y2": 618.7239999999999, "r_x3": 308.862, "r_y3": 618.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.245, "r_x1": 545.115, "r_y1": 665.245, "r_x2": 545.115, "r_y2": 656.693, "r_x3": 308.862, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 361.245, "r_y1": 677.201, "r_x2": 361.245, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "cal purposes.", "orig": "cal purposes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.44, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 365.44, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "Given the size of PubTabNet, we adopted its", "orig": "Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 487.322, "r_y1": 701.111, "r_x2": 487.322, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "as PNG images with a resolution of 72 dpi.", "orig": "as PNG images with a resolution of 72 dpi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.901, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 492.901, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 250.151, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.8767216801643372, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "picture", "bbox": {"l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT"}, "confidence": 0.9746918082237244, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 12, "label": "section_header", "bbox": {"l": 380.799, "t": 80.154, "r": 486.849, "b": 88.46699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.5687217116355896, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 5, "label": "text", "bbox": {"l": 62.067, "t": 87.48800000000006, "r": 70.366, "b": 96.03999999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9822593927383423, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "caption", "bbox": {"l": 308.862, "t": 268.105, "r": 346.062, "b": 276.65700000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9667505025863647, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 278.43899999999996, "r": 90.301, "b": 287.395, "coord_origin": "TOPLEFT"}, "confidence": 0.9878450036048889, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 317.742, "r": 437.27, "b": 326.294, "coord_origin": "TOPLEFT"}, "confidence": 0.8879811763763428, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 331.8, "r": 545.115, "b": 340.352, "coord_origin": "TOPLEFT"}, "confidence": 0.9870319366455078, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 493.689, "r": 252.881, "b": 502.645, "coord_origin": "TOPLEFT"}, "confidence": 0.9875094294548035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 320.817, "t": 632.783, "r": 545.115, "b": 641.335, "coord_origin": "TOPLEFT"}, "confidence": 0.9840091466903687, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "section_header", "bbox": {"l": 50.112, "t": 635.9449999999999, "r": 105.225, "b": 646.693, "coord_origin": "TOPLEFT"}, "confidence": 0.9423062205314636, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 656.694, "r": 286.365, "b": 665.246, "coord_origin": "TOPLEFT"}, "confidence": 0.9862047433853149, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8715606927871704, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 10, "page_no": 2, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 250.151, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.8767216801643372, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tag-decoder which is constrained to the table-tags."}, {"label": "picture", "id": 6, "page_no": 2, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT"}, "confidence": 0.9746918082237244, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 12, "label": "section_header", "bbox": {"l": 380.799, "t": 80.154, "r": 486.849, "b": 88.46699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.5687217116355896, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 5, "page_no": 2, "cluster": {"id": 5, "label": "text", "bbox": {"l": 62.067, "t": 87.48800000000006, "r": 70.366, "b": 96.03999999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9822593927383423, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In"}, {"label": "caption", "id": 7, "page_no": 2, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 308.862, "t": 268.105, "r": 346.062, "b": 276.65700000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9667505025863647, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 2:"}, {"label": "text", "id": 0, "page_no": 2, "cluster": {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 278.43899999999996, "r": 90.301, "b": 287.395, "coord_origin": "TOPLEFT"}, "confidence": 0.9878450036048889, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Graph"}, {"label": "text", "id": 9, "page_no": 2, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 317.742, "r": 437.27, "b": 326.294, "coord_origin": "TOPLEFT"}, "confidence": 0.8879811763763428, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "balance in the previous datasets."}, {"label": "text", "id": 2, "page_no": 2, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 331.8, "r": 545.115, "b": 340.352, "coord_origin": "TOPLEFT"}, "confidence": 0.9870319366455078, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The PubTabNet dataset contains 509k tables delivered as"}, {"label": "text", "id": 1, "page_no": 2, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 493.689, "r": 252.881, "b": 502.645, "coord_origin": "TOPLEFT"}, "confidence": 0.9875094294548035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Hybrid Deep Learning-Rule-Based approach"}, {"label": "text", "id": 4, "page_no": 2, "cluster": {"id": 4, "label": "text", "bbox": {"l": 320.817, "t": 632.783, "r": 545.115, "b": 641.335, "coord_origin": "TOPLEFT"}, "confidence": 0.9840091466903687, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Due to the heterogeneity across the dataset formats, it"}, {"label": "section_header", "id": 8, "page_no": 2, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 50.112, "t": 635.9449999999999, "r": 105.225, "b": 646.693, "coord_origin": "TOPLEFT"}, "confidence": 0.9423062205314636, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Datasets"}, {"label": "text", "id": 3, "page_no": 2, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 656.694, "r": 286.365, "b": 665.246, "coord_origin": "TOPLEFT"}, "confidence": 0.9862047433853149, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We rely on large-scale datasets such as PubTabNet [37],"}, {"label": "page_footer", "id": 11, "page_no": 2, "cluster": {"id": 11, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8715606927871704, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3"}], "body": [{"label": "text", "id": 10, "page_no": 2, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 250.151, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.8767216801643372, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tag-decoder which is constrained to the table-tags."}, {"label": "picture", "id": 6, "page_no": 2, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT"}, "confidence": 0.9746918082237244, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 12, "label": "section_header", "bbox": {"l": 380.799, "t": 80.154, "r": 486.849, "b": 88.46699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.5687217116355896, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 5, "page_no": 2, "cluster": {"id": 5, "label": "text", "bbox": {"l": 62.067, "t": 87.48800000000006, "r": 70.366, "b": 96.03999999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9822593927383423, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In"}, {"label": "caption", "id": 7, "page_no": 2, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 308.862, "t": 268.105, "r": 346.062, "b": 276.65700000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9667505025863647, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 2:"}, {"label": "text", "id": 0, "page_no": 2, "cluster": {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 278.43899999999996, "r": 90.301, "b": 287.395, "coord_origin": "TOPLEFT"}, "confidence": 0.9878450036048889, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Graph"}, {"label": "text", "id": 9, "page_no": 2, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 317.742, "r": 437.27, "b": 326.294, "coord_origin": "TOPLEFT"}, "confidence": 0.8879811763763428, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "balance in the previous datasets."}, {"label": "text", "id": 2, "page_no": 2, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 331.8, "r": 545.115, "b": 340.352, "coord_origin": "TOPLEFT"}, "confidence": 0.9870319366455078, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The PubTabNet dataset contains 509k tables delivered as"}, {"label": "text", "id": 1, "page_no": 2, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 493.689, "r": 252.881, "b": 502.645, "coord_origin": "TOPLEFT"}, "confidence": 0.9875094294548035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Hybrid Deep Learning-Rule-Based approach"}, {"label": "text", "id": 4, "page_no": 2, "cluster": {"id": 4, "label": "text", "bbox": {"l": 320.817, "t": 632.783, "r": 545.115, "b": 641.335, "coord_origin": "TOPLEFT"}, "confidence": 0.9840091466903687, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Due to the heterogeneity across the dataset formats, it"}, {"label": "section_header", "id": 8, "page_no": 2, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 50.112, "t": 635.9449999999999, "r": 105.225, "b": 646.693, "coord_origin": "TOPLEFT"}, "confidence": 0.9423062205314636, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Datasets"}, {"label": "text", "id": 3, "page_no": 2, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 656.694, "r": 286.365, "b": 665.246, "coord_origin": "TOPLEFT"}, "confidence": 0.9862047433853149, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We rely on large-scale datasets such as PubTabNet [37],"}], "headers": [{"label": "page_footer", "id": 11, "page_no": 2, "cluster": {"id": 11, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8715606927871704, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3"}]}}, {"page_no": 3, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 212.283, "r_y1": 95.98400000000004, "r_x2": 212.283, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 121.73599999999999, "r_x1": 176.458, "r_y1": 121.73599999999999, "r_x2": 176.458, "r_y2": 113.18399999999997, "r_x3": 50.112, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "is essential to train our models.", "orig": "is essential to train our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.971, "r_y0": 121.73599999999999, "r_x1": 286.365, "r_y1": 121.73599999999999, "r_x2": 286.365, "r_y2": 113.18399999999997, "r_x3": 180.971, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "In order to distinguish be-", "orig": "In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 133.69100000000003, "r_x1": 286.365, "r_y1": 133.69100000000003, "r_x2": 286.365, "r_y2": 125.13900000000001, "r_x3": 50.112, "r_y3": 125.13900000000001, "coord_origin": "TOPLEFT"}, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 145.64700000000005, "r_x1": 286.365, "r_y1": 145.64700000000005, "r_x2": 286.365, "r_y2": 137.09500000000003, "r_x3": 50.112, "r_y3": 137.09500000000003, "coord_origin": "TOPLEFT"}, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 157.60199999999998, "r_x1": 286.365, "r_y1": 157.60199999999998, "r_x2": 286.365, "r_y2": 149.04999999999995, "r_x3": 50.112, "r_y3": 149.04999999999995, "coord_origin": "TOPLEFT"}, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 169.55700000000002, "r_x1": 94.127, "r_y1": 169.55700000000002, "r_x2": 94.127, "r_y2": 161.005, "r_x3": 50.112, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "tables (e.g.", "orig": "tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 98.959, "r_y0": 169.55700000000002, "r_x1": 286.365, "r_y1": 169.55700000000002, "r_x2": 286.365, "r_y2": 161.005, "r_x3": 98.959, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "TableBank) or they narrow their scope only to", "orig": "TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 181.51199999999994, "r_x1": 116.951, "r_y1": 181.51199999999994, "r_x2": 116.951, "r_y2": 172.96000000000004, "r_x3": 50.112, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "non-empty cells.", "orig": "non-empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.345, "r_y0": 181.51199999999994, "r_x1": 286.365, "r_y1": 181.51199999999994, "r_x2": 286.365, "r_y2": 172.96000000000004, "r_x3": 121.345, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Therefore, it was imperative to introduce", "orig": "Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 193.46699999999998, "r_x1": 286.365, "r_y1": 193.46699999999998, "r_x2": 286.365, "r_y2": 184.91499999999996, "r_x3": 50.112, "r_y3": 184.91499999999996, "coord_origin": "TOPLEFT"}, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 205.423, "r_x1": 286.365, "r_y1": 205.423, "r_x2": 286.365, "r_y2": 196.87099999999998, "r_x3": 50.112, "r_y3": 196.87099999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 217.37800000000004, "r_x1": 286.365, "r_y1": 217.37800000000004, "r_x2": 286.365, "r_y2": 208.82600000000002, "r_x3": 50.112, "r_y3": 208.82600000000002, "coord_origin": "TOPLEFT"}, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 229.33299999999997, "r_x1": 286.365, "r_y1": 229.33299999999997, "r_x2": 286.365, "r_y2": 220.78099999999995, "r_x3": 50.112, "r_y3": 220.78099999999995, "coord_origin": "TOPLEFT"}, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 241.288, "r_x1": 139.805, "r_y1": 241.288, "r_x2": 139.805, "r_y2": 232.736, "r_x3": 50.112, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "ers the table structure.", "orig": "ers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.607, "r_y0": 241.288, "r_x1": 286.365, "r_y1": 241.288, "r_x2": 286.365, "r_y2": 232.736, "r_x3": 144.607, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "Notice that each table cell may oc-", "orig": "Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 253.24300000000005, "r_x1": 286.365, "r_y1": 253.24300000000005, "r_x2": 286.365, "r_y2": 244.69100000000003, "r_x3": 50.112, "r_y3": 244.69100000000003, "coord_origin": "TOPLEFT"}, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 265.198, "r_x1": 286.365, "r_y1": 265.198, "r_x2": 286.365, "r_y2": 256.64599999999996, "r_x3": 50.112, "r_y3": 256.64599999999996, "coord_origin": "TOPLEFT"}, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 277.154, "r_x1": 286.365, "r_y1": 277.154, "r_x2": 286.365, "r_y2": 268.602, "r_x3": 50.112, "r_y3": 268.602, "coord_origin": "TOPLEFT"}, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 289.109, "r_x1": 68.652, "r_y1": 289.109, "r_x2": 68.652, "r_y2": 280.557, "r_x3": 50.112, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.566, "r_y0": 289.109, "r_x1": 286.365, "r_y1": 289.109, "r_x2": 286.365, "r_y2": 280.557, "r_x3": 75.566, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 301.064, "r_x1": 286.365, "r_y1": 301.064, "r_x2": 286.365, "r_y2": 292.512, "r_x3": 50.112, "r_y3": 292.512, "coord_origin": "TOPLEFT"}, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 313.019, "r_x1": 75.696, "r_y1": 313.019, "r_x2": 75.696, "r_y2": 304.467, "r_x3": 50.112, "r_y3": 304.467, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 338.772, "r_x1": 60.075, "r_y1": 338.772, "r_x2": 60.075, "r_y2": 330.22, "r_x3": 50.112, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.146, "r_y0": 338.772, "r_x1": 96.687, "r_y1": 338.772, "r_x2": 96.687, "r_y2": 330.22, "r_x3": 65.146, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.768, "r_y0": 338.772, "r_x1": 113.932, "r_y1": 338.772, "r_x2": 113.932, "r_y2": 330.22, "r_x3": 101.768, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.003, "r_y0": 338.772, "r_x1": 148.533, "r_y1": 338.772, "r_x2": 148.533, "r_y2": 330.22, "r_x3": 119.003, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "skewed", "orig": "skewed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.613, "r_y0": 338.772, "r_x1": 184.806, "r_y1": 338.772, "r_x2": 184.806, "r_y2": 330.22, "r_x3": 153.613, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "towards", "orig": "towards", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.877, "r_y0": 338.772, "r_x1": 219.765, "r_y1": 338.772, "r_x2": 219.765, "r_y2": 330.22, "r_x3": 189.877, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "simpler", "orig": "simpler", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.836, "r_y0": 338.772, "r_x1": 263.571, "r_y1": 338.772, "r_x2": 263.571, "r_y2": 330.22, "r_x3": 224.836, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "structures", "orig": "structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.652, "r_y0": 338.772, "r_x1": 286.365, "r_y1": 338.772, "r_x2": 286.365, "r_y2": 330.22, "r_x3": 268.652, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 350.727, "r_x1": 286.365, "r_y1": 350.727, "r_x2": 286.365, "r_y2": 342.175, "r_x3": 50.112, "r_y3": 342.175, "coord_origin": "TOPLEFT"}, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 362.682, "r_x1": 286.365, "r_y1": 362.682, "r_x2": 286.365, "r_y2": 354.13, "r_x3": 50.112, "r_y3": 354.13, "coord_origin": "TOPLEFT"}, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 374.637, "r_x1": 286.365, "r_y1": 374.637, "r_x2": 286.365, "r_y2": 366.085, "r_x3": 50.112, "r_y3": 366.085, "coord_origin": "TOPLEFT"}, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 386.592, "r_x1": 141.589, "r_y1": 386.592, "r_x2": 141.589, "r_y2": 378.04, "r_x3": 50.112, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.702, "r_y0": 386.592, "r_x1": 286.365, "r_y1": 386.592, "r_x2": 286.365, "r_y2": 378.04, "r_x3": 148.702, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 398.547, "r_x1": 286.365, "r_y1": 398.547, "r_x2": 286.365, "r_y2": 389.995, "r_x3": 50.112, "r_y3": 389.995, "coord_origin": "TOPLEFT"}, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 410.503, "r_x1": 201.822, "r_y1": 410.503, "r_x2": 201.822, "r_y2": 401.951, "r_x3": 50.112, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Net) is restricted to a certain domain.", "orig": "Net) is restricted to a certain domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.764, "r_y0": 410.503, "r_x1": 286.365, "r_y1": 410.503, "r_x2": 286.365, "r_y2": 401.951, "r_x3": 206.764, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Ultimately, the lack", "orig": "Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 422.458, "r_x1": 286.365, "r_y1": 422.458, "r_x2": 286.365, "r_y2": 413.906, "r_x3": 50.112, "r_y3": 413.906, "coord_origin": "TOPLEFT"}, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 434.413, "r_x1": 216.398, "r_y1": 434.413, "r_x2": 216.398, "r_y2": 425.861, "r_x3": 50.112, "r_y3": 425.861, "coord_origin": "TOPLEFT"}, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.165, "r_x1": 172.144, "r_y1": 460.165, "r_x2": 172.144, "r_y2": 451.613, "r_x3": 50.112, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.148, "r_y0": 460.022, "r_x1": 224.708, "r_y1": 460.022, "r_x2": 224.708, "r_y2": 451.434, "r_x3": 174.148, "r_y3": 451.434, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.708, "r_y0": 460.165, "r_x1": 227.199, "r_y1": 460.165, "r_x2": 227.199, "r_y2": 451.613, "r_x3": 224.708, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.128, "r_y0": 460.165, "r_x1": 286.367, "r_y1": 460.165, "r_x2": 286.367, "r_y2": 451.613, "r_x3": 230.128, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "This approach", "orig": "This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 472.121, "r_x1": 128.179, "r_y1": 472.121, "r_x2": 128.179, "r_y2": 463.569, "r_x3": 50.112, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "offers control over:", "orig": "offers control over:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.971, "r_y0": 472.121, "r_x1": 286.365, "r_y1": 472.121, "r_x2": 286.365, "r_y2": 463.569, "r_x3": 132.971, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "1) the size of the dataset, 2) the table", "orig": "1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 484.076, "r_x1": 266.739, "r_y1": 484.076, "r_x2": 266.739, "r_y2": 475.524, "r_x3": 50.112, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "structure, 3) the table style and 4) the type of content.", "orig": "structure, 3) the table style and 4) the type of content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.873, "r_y0": 484.076, "r_x1": 286.365, "r_y1": 484.076, "r_x2": 286.365, "r_y2": 475.524, "r_x3": 270.873, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 496.031, "r_x1": 286.365, "r_y1": 496.031, "r_x2": 286.365, "r_y2": 487.479, "r_x3": 50.112, "r_y3": 487.479, "coord_origin": "TOPLEFT"}, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.986, "r_x1": 286.365, "r_y1": 507.986, "r_x2": 286.365, "r_y2": 499.434, "r_x3": 50.112, "r_y3": 499.434, "coord_origin": "TOPLEFT"}, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.941, "r_x1": 286.365, "r_y1": 519.941, "r_x2": 286.365, "r_y2": 511.389, "r_x3": 50.112, "r_y3": 511.389, "coord_origin": "TOPLEFT"}, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.8969999999999, "r_x1": 286.365, "r_y1": 531.8969999999999, "r_x2": 286.365, "r_y2": 523.345, "r_x3": 50.112, "r_y3": 523.345, "coord_origin": "TOPLEFT"}, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.852, "r_x1": 286.365, "r_y1": 543.852, "r_x2": 286.365, "r_y2": 535.3, "r_x3": 50.112, "r_y3": 535.3, "coord_origin": "TOPLEFT"}, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.807, "r_x1": 286.365, "r_y1": 555.807, "r_x2": 286.365, "r_y2": 547.255, "r_x3": 50.112, "r_y3": 547.255, "coord_origin": "TOPLEFT"}, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.762, "r_x1": 83.028, "r_y1": 567.762, "r_x2": 83.028, "r_y2": 559.21, "r_x3": 50.112, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "corpora.", "orig": "corpora.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.153, "r_y0": 567.762, "r_x1": 286.365, "r_y1": 567.762, "r_x2": 286.365, "r_y2": 559.21, "r_x3": 87.153, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "By controlling the size and scope of the synthetic", "orig": "By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.717, "r_x1": 286.365, "r_y1": 579.717, "r_x2": 286.365, "r_y2": 571.165, "r_x3": 50.112, "r_y3": 571.165, "coord_origin": "TOPLEFT"}, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.672, "r_x1": 174.645, "r_y1": 591.672, "r_x2": 174.645, "r_y2": 583.12, "r_x3": 50.112, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "variety of different conditions.", "orig": "variety of different conditions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.021, "r_y0": 591.672, "r_x1": 286.365, "r_y1": 591.672, "r_x2": 286.365, "r_y2": 583.12, "r_x3": 181.021, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "For example, we can first", "orig": "For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.6279999999999, "r_x1": 286.365, "r_y1": 603.6279999999999, "r_x2": 286.365, "r_y2": 595.076, "r_x3": 50.112, "r_y3": 595.076, "coord_origin": "TOPLEFT"}, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.583, "r_x1": 286.365, "r_y1": 615.583, "r_x2": 286.365, "r_y2": 607.031, "r_x3": 50.112, "r_y3": 607.031, "coord_origin": "TOPLEFT"}, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.538, "r_x1": 209.753, "r_y1": 627.538, "r_x2": 209.753, "r_y2": 618.986, "r_x3": 50.112, "r_y3": 618.986, "coord_origin": "TOPLEFT"}, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 50.112, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 109.519, "r_y1": 689.156, "r_x2": 109.519, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "generated text.", "orig": "generated text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 115.337, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 115.337, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "The first two synthetic datasets have been", "orig": "The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 336.867, "r_y0": 176.48199999999997, "r_x1": 344.618, "r_y1": 176.48199999999997, "r_x2": 344.618, "r_y2": 167.92999999999995, "r_x3": 336.867, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "1:", "orig": "1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.076, "r_y0": 176.48199999999997, "r_x1": 380.453, "r_y1": 176.48199999999997, "r_x2": 380.453, "r_y2": 167.92999999999995, "r_x3": 361.076, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.568, "r_y0": 176.33900000000006, "r_x1": 468.68, "r_y1": 176.33900000000006, "r_x2": 468.68, "r_y2": 167.75099999999998, "r_x3": 386.568, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-Tabnet'", "orig": "'Combined-Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.796, "r_y0": 176.48199999999997, "r_x1": 489.182, "r_y1": 176.48199999999997, "r_x2": 489.182, "r_y2": 167.92999999999995, "r_x3": 474.796, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.299, "r_y0": 176.33900000000006, "r_x1": 545.112, "r_y1": 176.33900000000006, "r_x2": 545.112, "r_y2": 167.75099999999998, "r_x3": 495.299, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-", "orig": "'Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 188.29399999999998, "r_x1": 341.161, "r_y1": 188.29399999999998, "r_x2": 341.161, "r_y2": 179.70600000000002, "r_x3": 308.862, "r_y3": 179.70600000000002, "coord_origin": "TOPLEFT"}, "text": "Tabnet'", "orig": "Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.457, "r_y0": 188.437, "r_x1": 545.11, "r_y1": 188.437, "r_x2": 545.11, "r_y2": 179.885, "r_x3": 343.457, "r_y3": 179.885, "coord_origin": "TOPLEFT"}, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 200.39200000000005, "r_x1": 545.115, "r_y1": 200.39200000000005, "r_x2": 545.115, "r_y2": 191.84000000000003, "r_x3": 308.862, "r_y3": 191.84000000000003, "coord_origin": "TOPLEFT"}, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 212.34699999999998, "r_x1": 366.276, "r_y1": 212.34699999999998, "r_x2": 366.276, "r_y2": 203.79499999999996, "r_x3": 308.862, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "and Fintabnet.", "orig": "and Fintabnet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.58, "r_y0": 212.34699999999998, "r_x1": 545.115, "r_y1": 212.34699999999998, "r_x2": 545.115, "r_y2": 203.79499999999996, "r_x3": 370.58, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "(**) The combined dataset is the processed", "orig": "(**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 224.303, "r_x1": 523.935, "r_y1": 224.303, "r_x2": 523.935, "r_y2": 215.75099999999998, "r_x3": 308.862, "r_y3": 215.75099999999998, "coord_origin": "TOPLEFT"}, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.39599999999996, "r_x1": 545.115, "r_y1": 270.39599999999996, "r_x2": 545.115, "r_y2": 261.84400000000005, "r_x3": 308.862, "r_y3": 261.84400000000005, "coord_origin": "TOPLEFT"}, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.351, "r_x1": 545.115, "r_y1": 282.351, "r_x2": 545.115, "r_y2": 273.799, "r_x3": 308.862, "r_y3": 273.799, "coord_origin": "TOPLEFT"}, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.306, "r_x1": 436.822, "r_y1": 294.306, "r_x2": 436.822, "r_y2": 285.754, "r_x3": 308.862, "r_y3": 285.754, "coord_origin": "TOPLEFT"}, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 362.715, "r_x1": 326.576, "r_y1": 362.715, "r_x2": 326.576, "r_y2": 354.163, "r_x3": 308.862, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "dict:", "orig": "dict:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.172, "r_y0": 362.715, "r_x1": 545.115, "r_y1": 362.715, "r_x2": 545.115, "r_y2": 354.163, "r_x3": 330.172, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "1) a sequence of tokens that represent the structure of", "orig": "1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 374.67, "r_x1": 545.115, "r_y1": 374.67, "r_x2": 545.115, "r_y2": 366.118, "r_x3": 308.862, "r_y3": 366.118, "coord_origin": "TOPLEFT"}, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 386.625, "r_x1": 337.265, "r_y1": 386.625, "r_x2": 337.265, "r_y2": 378.073, "r_x3": 308.862, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "tokens.", "orig": "tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.808, "r_y0": 386.625, "r_x1": 545.115, "r_y1": 386.625, "r_x2": 545.115, "r_y2": 378.073, "r_x3": 341.808, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "The conversion of an image into a sequence of to-", "orig": "The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 398.58, "r_x1": 545.115, "r_y1": 398.58, "r_x2": 545.115, "r_y2": 390.028, "r_x3": 308.862, "r_y3": 390.028, "coord_origin": "TOPLEFT"}, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 410.535, "r_x1": 545.115, "r_y1": 410.535, "r_x2": 545.115, "r_y2": 401.983, "r_x3": 308.862, "r_y3": 401.983, "coord_origin": "TOPLEFT"}, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 422.491, "r_x1": 545.115, "r_y1": 422.491, "r_x2": 545.115, "r_y2": 413.939, "r_x3": 308.862, "r_y3": 413.939, "coord_origin": "TOPLEFT"}, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 434.446, "r_x1": 545.115, "r_y1": 434.446, "r_x2": 545.115, "r_y2": 425.894, "r_x3": 308.862, "r_y3": 425.894, "coord_origin": "TOPLEFT"}, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 446.401, "r_x1": 437.937, "r_y1": 446.401, "r_x2": 437.937, "r_y2": 437.849, "r_x3": 308.862, "r_y3": 437.849, "coord_origin": "TOPLEFT"}, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.541, "r_x1": 315.507, "r_y1": 497.541, "r_x2": 315.507, "r_y2": 488.989, "r_x3": 308.862, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.153, "r_y0": 497.541, "r_x1": 509.021, "r_y1": 497.541, "r_x2": 509.021, "r_y2": 488.989, "r_x3": 319.153, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "composed of three main components, see Fig.", "orig": "composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.586, "r_y0": 497.541, "r_x1": 523.058, "r_y1": 497.541, "r_x2": 523.058, "r_y2": 488.989, "r_x3": 515.586, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 497.541, "r_x1": 545.115, "r_y1": 497.541, "r_x2": 545.115, "r_y2": 488.989, "r_x3": 529.623, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.353, "r_x1": 406.346, "r_y1": 509.353, "r_x2": 406.346, "r_y2": 500.765, "r_x3": 308.862, "r_y3": 500.765, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.872, "r_y0": 509.496, "r_x1": 545.111, "r_y1": 509.496, "r_x2": 545.111, "r_y2": 500.944, "r_x3": 408.872, "r_y3": 500.944, "coord_origin": "TOPLEFT"}, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.452, "r_x1": 319.93, "r_y1": 521.452, "r_x2": 319.93, "r_y2": 512.9, "r_x3": 308.862, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "tor", "orig": "tor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.836, "r_y0": 521.452, "r_x1": 409.395, "r_y1": 521.452, "r_x2": 409.395, "r_y2": 512.9, "r_x3": 323.836, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "of predefined length.", "orig": "of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.727, "r_y0": 521.452, "r_x1": 545.115, "r_y1": 521.452, "r_x2": 545.115, "r_y2": 512.9, "r_x3": 416.727, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.4069999999999, "r_x1": 436.194, "r_y1": 533.4069999999999, "r_x2": 436.194, "r_y2": 524.855, "r_x3": 308.862, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.526, "r_y0": 533.264, "r_x1": 513.867, "r_y1": 533.264, "r_x2": 513.867, "r_y2": 524.6759999999999, "r_x3": 439.526, "r_y3": 524.6759999999999, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 517.432, "r_y0": 533.4069999999999, "r_x1": 545.108, "r_y1": 533.4069999999999, "r_x2": 545.108, "r_y2": 524.855, "r_x3": 517.432, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.362, "r_x1": 545.115, "r_y1": 545.362, "r_x2": 545.115, "r_y2": 536.81, "r_x3": 308.862, "r_y3": 536.81, "coord_origin": "TOPLEFT"}, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.317, "r_x1": 358.545, "r_y1": 557.317, "r_x2": 358.545, "r_y2": 548.765, "r_x3": 308.862, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.191, "r_y0": 557.317, "r_x1": 545.115, "r_y1": 557.317, "r_x2": 545.115, "r_y2": 548.765, "r_x3": 365.191, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.2719999999999, "r_x1": 352.409, "r_y1": 569.2719999999999, "r_x2": 352.409, "r_y2": 560.72, "r_x3": 308.862, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "data cell ('", "orig": "data cell ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.409, "r_y0": 569.108, "r_x1": 360.158, "r_y1": 569.108, "r_x2": 360.158, "r_y2": 560.402, "r_x3": 352.409, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.158, "r_y0": 569.2719999999999, "r_x1": 367.909, "r_y1": 569.2719999999999, "r_x2": 367.909, "r_y2": 560.72, "r_x3": 360.158, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.909, "r_y0": 569.108, "r_x1": 375.658, "r_y1": 569.108, "r_x2": 375.658, "r_y2": 560.402, "r_x3": 367.909, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.658, "r_y0": 569.2719999999999, "r_x1": 545.112, "r_y1": 569.2719999999999, "r_x2": 545.112, "r_y2": 560.72, "r_x3": 375.658, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "') the hidden state of that cell is passed to", "orig": "') the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.2280000000001, "r_x1": 545.115, "r_y1": 581.2280000000001, "r_x2": 545.115, "r_y2": 572.6759999999999, "r_x3": 308.862, "r_y3": 572.6759999999999, "coord_origin": "TOPLEFT"}, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.183, "r_x1": 483.118, "r_y1": 593.183, "r_x2": 483.118, "r_y2": 584.631, "r_x3": 308.862, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "or column span, the tag is broken down to '", "orig": "or column span, the tag is broken down to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 593.019, "r_x1": 490.868, "r_y1": 593.019, "r_x2": 490.868, "r_y2": 584.313, "r_x3": 483.119, "r_y3": 584.313, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.868, "r_y0": 593.183, "r_x1": 545.114, "r_y1": 593.183, "r_x2": 545.114, "r_y2": 584.631, "r_x3": 490.868, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "', 'rowspan='", "orig": "', 'rowspan='", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.138, "r_x1": 545.115, "r_y1": 605.138, "r_x2": 545.115, "r_y2": 596.586, "r_x3": 308.862, "r_y3": 596.586, "coord_origin": "TOPLEFT"}, "text": "or 'colspan=', with the number of spanning cells (attribute),", "orig": "or 'colspan=', with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.093, "r_x1": 329.644, "r_y1": 617.093, "r_x2": 329.644, "r_y2": 608.5409999999999, "r_x3": 308.862, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "and '", "orig": "and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.646, "r_y0": 616.929, "r_x1": 337.395, "r_y1": 616.929, "r_x2": 337.395, "r_y2": 608.223, "r_x3": 329.646, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.394, "r_y0": 617.093, "r_x1": 343.202, "r_y1": 617.093, "r_x2": 343.202, "r_y2": 608.5409999999999, "r_x3": 337.394, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "'.", "orig": "'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.064, "r_y0": 617.093, "r_x1": 468.591, "r_y1": 617.093, "r_x2": 468.591, "r_y2": 608.5409999999999, "r_x3": 348.064, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "The hidden state attached to '", "orig": "The hidden state attached to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.595, "r_y0": 616.929, "r_x1": 476.344, "r_y1": 616.929, "r_x2": 476.344, "r_y2": 608.223, "r_x3": 468.595, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.344, "r_y0": 617.093, "r_x1": 545.116, "r_y1": 617.093, "r_x2": 545.116, "r_y2": 608.5409999999999, "r_x3": 476.344, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "' is passed to the", "orig": "' is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.048, "r_x1": 545.115, "r_y1": 629.048, "r_x2": 545.115, "r_y2": 620.496, "r_x3": 308.862, "r_y3": 620.496, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0029999999999, "r_x1": 533.2, "r_y1": 641.0029999999999, "r_x2": 533.2, "r_y2": 632.451, "r_x3": 308.862, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "receives the hidden states from the Structure Decoder,", "orig": "receives the hidden states from the Structure Decoder,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.364, "r_y0": 641.0029999999999, "r_x1": 545.115, "r_y1": 641.0029999999999, "r_x2": 545.115, "r_y2": 632.451, "r_x3": 537.364, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.9590000000001, "r_x1": 545.115, "r_y1": 652.9590000000001, "r_x2": 545.115, "r_y2": 644.407, "r_x3": 308.862, "r_y3": 644.407, "coord_origin": "TOPLEFT"}, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.914, "r_x1": 449.424, "r_y1": 664.914, "r_x2": 449.424, "r_y2": 656.362, "r_x3": 308.862, "r_y3": 656.362, "coord_origin": "TOPLEFT"}, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.499, "r_y0": 677.201, "r_x1": 545.113, "r_y1": 677.201, "r_x2": 545.113, "r_y2": 668.649, "r_x3": 439.499, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9611433148384094, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 101.22900000000004, "r": 286.365, "b": 109.78099999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.988013744354248, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "caption", "bbox": {"l": 308.862, "t": 167.92999999999995, "r": 330.75, "b": 176.48199999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9667726755142212, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "text", "bbox": {"l": 308.862, "t": 249.889, "r": 545.115, "b": 258.44100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.978954017162323, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 320.817, "t": 298.041, "r": 542.744, "b": 306.593, "coord_origin": "TOPLEFT"}, "confidence": 0.9043695330619812, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 318.264, "r": 286.365, "b": 326.816, "coord_origin": "TOPLEFT"}, "confidence": 0.9873981475830078, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "section_header", "bbox": {"l": 308.862, "t": 321.184, "r": 444.936, "b": 331.932, "coord_origin": "TOPLEFT"}, "confidence": 0.9466595649719238, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 342.208, "r": 545.115, "b": 350.76, "coord_origin": "TOPLEFT"}, "confidence": 0.9884450435638428, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 439.658, "r": 286.365, "b": 448.21, "coord_origin": "TOPLEFT"}, "confidence": 0.9876030087471008, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "section_header", "bbox": {"l": 308.862, "t": 457.694, "r": 420.161, "b": 467.546, "coord_origin": "TOPLEFT"}, "confidence": 0.937696099281311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 477.034, "r": 545.115, "b": 485.586, "coord_origin": "TOPLEFT"}, "confidence": 0.9878323078155518, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "text", "bbox": {"l": 62.067, "t": 632.783, "r": 286.365, "b": 641.335, "coord_origin": "TOPLEFT"}, "confidence": 0.9871614575386047, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 320.817, "t": 668.261, "r": 431.91, "b": 677.217, "coord_origin": "TOPLEFT"}, "confidence": 0.978580117225647, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8565718531608582, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"8": {"label": "table", "id": 8, "page_no": 3, "cluster": {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 10, "page_no": 3, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9611433148384094, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "amount of such tables, and kept only those ones ranging"}, {"label": "text", "id": 1, "page_no": 3, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 101.22900000000004, "r": 286.365, "b": 109.78099999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.988013744354248, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The availability of the bounding boxes for all table cells"}, {"label": "caption", "id": 9, "page_no": 3, "cluster": {"id": 9, "label": "caption", "bbox": {"l": 308.862, "t": 167.92999999999995, "r": 330.75, "b": 176.48199999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9667726755142212, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table"}, {"label": "text", "id": 6, "page_no": 3, "cluster": {"id": 6, "label": "text", "bbox": {"l": 308.862, "t": 249.889, "r": 545.115, "b": 258.44100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.978954017162323, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "one adopts a colorful appearance with high contrast and the"}, {"label": "text", "id": 13, "page_no": 3, "cluster": {"id": 13, "label": "text", "bbox": {"l": 320.817, "t": 298.041, "r": 542.744, "b": 306.593, "coord_origin": "TOPLEFT"}, "confidence": 0.9043695330619812, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tab. 1 summarizes the various attributes of the datasets."}, {"label": "text", "id": 4, "page_no": 3, "cluster": {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 318.264, "r": 286.365, "b": 326.816, "coord_origin": "TOPLEFT"}, "confidence": 0.9873981475830078, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As it is illustrated in Fig. 2, the table distributions from"}, {"label": "section_header", "id": 11, "page_no": 3, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 308.862, "t": 321.184, "r": 444.936, "b": 331.932, "coord_origin": "TOPLEFT"}, "confidence": 0.9466595649719238, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. The TableFormer model"}, {"label": "text", "id": 0, "page_no": 3, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 342.208, "r": 545.115, "b": 350.76, "coord_origin": "TOPLEFT"}, "confidence": 0.9884450435638428, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Given the image of a table, TableFormer is able to pre-"}, {"label": "text", "id": 3, "page_no": 3, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 439.658, "r": 286.365, "b": 448.21, "coord_origin": "TOPLEFT"}, "confidence": 0.9876030087471008, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Motivated by those observations we aimed at generating"}, {"label": "section_header", "id": 12, "page_no": 3, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 308.862, "t": 457.694, "r": 420.161, "b": 467.546, "coord_origin": "TOPLEFT"}, "confidence": 0.937696099281311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.1. Model architecture."}, {"label": "text", "id": 2, "page_no": 3, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 477.034, "r": 545.115, "b": 485.586, "coord_origin": "TOPLEFT"}, "confidence": 0.9878323078155518, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We now describe in detail the proposed method, which"}, {"label": "text", "id": 5, "page_no": 3, "cluster": {"id": 5, "label": "text", "bbox": {"l": 62.067, "t": 632.783, "r": 286.365, "b": 641.335, "coord_origin": "TOPLEFT"}, "confidence": 0.9871614575386047, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this regard, we have prepared four synthetic datasets,"}, {"label": "text", "id": 7, "page_no": 3, "cluster": {"id": 7, "label": "text", "bbox": {"l": 320.817, "t": 668.261, "r": 431.91, "b": 677.217, "coord_origin": "TOPLEFT"}, "confidence": 0.978580117225647, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "CNN Backbone Network."}, {"label": "page_footer", "id": 14, "page_no": 3, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8565718531608582, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4"}, {"label": "table", "id": 8, "page_no": 3, "cluster": {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "text", "id": 10, "page_no": 3, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9611433148384094, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "amount of such tables, and kept only those ones ranging"}, {"label": "text", "id": 1, "page_no": 3, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 101.22900000000004, "r": 286.365, "b": 109.78099999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.988013744354248, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The availability of the bounding boxes for all table cells"}, {"label": "caption", "id": 9, "page_no": 3, "cluster": {"id": 9, "label": "caption", "bbox": {"l": 308.862, "t": 167.92999999999995, "r": 330.75, "b": 176.48199999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9667726755142212, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table"}, {"label": "text", "id": 6, "page_no": 3, "cluster": {"id": 6, "label": "text", "bbox": {"l": 308.862, "t": 249.889, "r": 545.115, "b": 258.44100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.978954017162323, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "one adopts a colorful appearance with high contrast and the"}, {"label": "text", "id": 13, "page_no": 3, "cluster": {"id": 13, "label": "text", "bbox": {"l": 320.817, "t": 298.041, "r": 542.744, "b": 306.593, "coord_origin": "TOPLEFT"}, "confidence": 0.9043695330619812, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tab. 1 summarizes the various attributes of the datasets."}, {"label": "text", "id": 4, "page_no": 3, "cluster": {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 318.264, "r": 286.365, "b": 326.816, "coord_origin": "TOPLEFT"}, "confidence": 0.9873981475830078, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As it is illustrated in Fig. 2, the table distributions from"}, {"label": "section_header", "id": 11, "page_no": 3, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 308.862, "t": 321.184, "r": 444.936, "b": 331.932, "coord_origin": "TOPLEFT"}, "confidence": 0.9466595649719238, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. The TableFormer model"}, {"label": "text", "id": 0, "page_no": 3, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 342.208, "r": 545.115, "b": 350.76, "coord_origin": "TOPLEFT"}, "confidence": 0.9884450435638428, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Given the image of a table, TableFormer is able to pre-"}, {"label": "text", "id": 3, "page_no": 3, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 439.658, "r": 286.365, "b": 448.21, "coord_origin": "TOPLEFT"}, "confidence": 0.9876030087471008, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Motivated by those observations we aimed at generating"}, {"label": "section_header", "id": 12, "page_no": 3, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 308.862, "t": 457.694, "r": 420.161, "b": 467.546, "coord_origin": "TOPLEFT"}, "confidence": 0.937696099281311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.1. Model architecture."}, {"label": "text", "id": 2, "page_no": 3, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 477.034, "r": 545.115, "b": 485.586, "coord_origin": "TOPLEFT"}, "confidence": 0.9878323078155518, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We now describe in detail the proposed method, which"}, {"label": "text", "id": 5, "page_no": 3, "cluster": {"id": 5, "label": "text", "bbox": {"l": 62.067, "t": 632.783, "r": 286.365, "b": 641.335, "coord_origin": "TOPLEFT"}, "confidence": 0.9871614575386047, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this regard, we have prepared four synthetic datasets,"}, {"label": "text", "id": 7, "page_no": 3, "cluster": {"id": 7, "label": "text", "bbox": {"l": 320.817, "t": 668.261, "r": 431.91, "b": 677.217, "coord_origin": "TOPLEFT"}, "confidence": 0.978580117225647, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "CNN Backbone Network."}, {"label": "table", "id": 8, "page_no": 3, "cluster": {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_footer", "id": 14, "page_no": 3, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8565718531608582, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4"}]}}, {"page_no": 4, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.021, "r_y0": 212.942, "r_x1": 149.851, "r_y1": 212.942, "r_x2": 149.851, "r_y2": 203.986, "r_x3": 94.021, "r_y3": 203.986, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.861, "r_y0": 212.92600000000004, "r_x1": 545.108, "r_y1": 212.92600000000004, "r_x2": 545.108, "r_y2": 204.37400000000002, "r_x3": 152.861, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 224.88099999999997, "r_x1": 436.013, "r_y1": 224.88099999999997, "r_x2": 436.013, "r_y2": 216.32899999999995, "r_x3": 50.112, "r_y3": 216.32899999999995, "coord_origin": "TOPLEFT"}, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 162.988, "r_y1": 274.491, "r_x2": 162.988, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 80.27, "r_y1": 343.926, "r_x2": 80.27, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 154.665, "r_y1": 298.344, "r_x2": 154.665, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 271.778, "r_y1": 410.598, "r_x2": 271.778, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 270.786, "r_y1": 443.622, "r_x2": 270.785, "r_y2": 439.21, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 212.161, "r_y1": 298.506, "r_x2": 212.161, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 197.29, "r_y1": 328.837, "r_x2": 197.29, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.73, "r_y0": 536.723, "r_x1": 229.787, "r_y1": 536.723, "r_x2": 229.787, "r_y2": 528.171, "r_x3": 90.73, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Given an input image of a table, the", "orig": "Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.787, "r_y0": 536.739, "r_x1": 267.762, "r_y1": 536.739, "r_x2": 267.762, "r_y2": 527.783, "r_x3": 231.787, "r_y3": 527.783, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.764, "r_y0": 536.723, "r_x1": 286.362, "r_y1": 536.723, "r_x2": 286.362, "r_y2": 528.171, "r_x3": 269.764, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 548.678, "r_x1": 286.365, "r_y1": 548.678, "r_x2": 286.365, "r_y2": 540.126, "r_x3": 50.112, "r_y3": 540.126, "coord_origin": "TOPLEFT"}, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 560.634, "r_x1": 205.847, "r_y1": 560.634, "r_x2": 205.847, "r_y2": 552.082, "r_x3": 50.112, "r_y3": 552.082, "coord_origin": "TOPLEFT"}, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.018, "r_y0": 560.65, "r_x1": 286.364, "r_y1": 560.65, "r_x2": 286.364, "r_y2": 551.694, "r_x3": 208.018, "r_y3": 551.694, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 572.5889999999999, "r_x1": 64.498, "r_y1": 572.5889999999999, "r_x2": 64.498, "r_y2": 564.037, "r_x3": 50.112, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.165, "r_y0": 572.605, "r_x1": 151.313, "r_y1": 572.605, "r_x2": 151.313, "r_y2": 563.649, "r_x3": 68.165, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.313, "r_y0": 572.5889999999999, "r_x1": 153.804, "r_y1": 572.5889999999999, "r_x2": 153.804, "r_y2": 564.037, "r_x3": 151.313, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.419, "r_y0": 572.5889999999999, "r_x1": 241.933, "r_y1": 572.5889999999999, "r_x2": 241.933, "r_y2": 564.037, "r_x3": 160.419, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.595, "r_y0": 572.605, "r_x1": 286.362, "r_y1": 572.605, "r_x2": 286.362, "r_y2": 563.649, "r_x3": 245.595, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 584.56, "r_x1": 85.519, "r_y1": 584.56, "r_x2": 85.519, "r_y2": 575.604, "r_x3": 50.112, "r_y3": 575.604, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.623, "r_y0": 584.544, "r_x1": 286.361, "r_y1": 584.544, "r_x2": 286.361, "r_y2": 575.992, "r_x3": 88.623, "r_y3": 575.992, "coord_origin": "TOPLEFT"}, "text": "receives 'tokenized tags' of the HTML code that", "orig": "receives 'tokenized tags' of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 596.499, "r_x1": 286.365, "r_y1": 596.499, "r_x2": 286.365, "r_y2": 587.947, "r_x3": 50.112, "r_y3": 587.947, "coord_origin": "TOPLEFT"}, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 608.454, "r_x1": 286.365, "r_y1": 608.454, "r_x2": 286.365, "r_y2": 599.902, "r_x3": 50.112, "r_y3": 599.902, "coord_origin": "TOPLEFT"}, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 620.409, "r_x1": 240.438, "r_y1": 620.409, "r_x2": 240.438, "r_y2": 611.857, "r_x3": 50.112, "r_y3": 611.857, "coord_origin": "TOPLEFT"}, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.198, "r_y0": 620.425, "r_x1": 286.366, "r_y1": 620.425, "r_x2": 286.366, "r_y2": 611.469, "r_x3": 243.198, "r_y3": 611.469, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 632.381, "r_x1": 87.013, "r_y1": 632.381, "r_x2": 87.013, "r_y2": 623.425, "r_x3": 50.112, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "Decoder.", "orig": "Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.14, "r_y0": 632.381, "r_x1": 286.365, "r_y1": 632.381, "r_x2": 286.365, "r_y2": 623.425, "r_x3": 93.14, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "The linear layer is applied to the features to", "orig": "The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 644.336, "r_x1": 286.365, "r_y1": 644.336, "r_x2": 286.365, "r_y2": 635.38, "r_x3": 50.112, "r_y3": 635.38, "coord_origin": "TOPLEFT"}, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 656.275, "r_x1": 220.582, "r_y1": 656.275, "r_x2": 220.582, "r_y2": 647.723, "r_x3": 50.112, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "selects features referring to the data cells ('", "orig": "selects features referring to the data cells ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.578, "r_y0": 656.111, "r_x1": 228.327, "r_y1": 656.111, "r_x2": 228.327, "r_y2": 647.405, "r_x3": 220.578, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.327, "r_y0": 656.275, "r_x1": 236.078, "r_y1": 656.275, "r_x2": 236.078, "r_y2": 647.723, "r_x3": 228.327, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.078, "r_y0": 656.111, "r_x1": 243.827, "r_y1": 656.111, "r_x2": 243.827, "r_y2": 647.405, "r_x3": 236.078, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.826, "r_y0": 656.275, "r_x1": 255.293, "r_y1": 656.275, "r_x2": 255.293, "r_y2": 647.723, "r_x3": 243.826, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "', '", "orig": "', '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.291, "r_y0": 656.111, "r_x1": 263.04, "r_y1": 656.111, "r_x2": 263.04, "r_y2": 647.405, "r_x3": 255.291, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.04, "r_y0": 656.275, "r_x1": 286.362, "r_y1": 656.275, "r_x2": 286.362, "r_y2": 647.723, "r_x3": 263.04, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "') and", "orig": "') and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 668.23, "r_x1": 286.365, "r_y1": 668.23, "r_x2": 286.365, "r_y2": 659.678, "r_x3": 50.112, "r_y3": 659.678, "coord_origin": "TOPLEFT"}, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 680.185, "r_x1": 218.47, "r_y1": 680.185, "r_x2": 218.47, "r_y2": 671.633, "r_x3": 50.112, "r_y3": 671.633, "coord_origin": "TOPLEFT"}, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.31100000000004, "r_x1": 366.466, "r_y1": 270.31100000000004, "r_x2": 366.466, "r_y2": 261.759, "r_x3": 308.862, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "of size 28*28.", "orig": "of size 28*28.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.706, "r_y0": 270.31100000000004, "r_x1": 545.115, "r_y1": 270.31100000000004, "r_x2": 545.115, "r_y2": 261.759, "r_x3": 371.706, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "ResNet by default downsamples the image", "orig": "ResNet by default downsamples the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.266, "r_x1": 545.115, "r_y1": 282.266, "r_x2": 545.115, "r_y2": 273.71400000000006, "r_x3": 308.862, "r_y3": 273.71400000000006, "coord_origin": "TOPLEFT"}, "text": "resolution by 32 and then the encoded image is provided to", "orig": "resolution by 32 and then the encoded image is provided to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.221, "r_x1": 341.24, "r_y1": 294.221, "r_x2": 341.24, "r_y2": 285.669, "r_x3": 308.862, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.731, "r_y0": 294.078, "r_x1": 417.235, "r_y1": 294.078, "r_x2": 417.235, "r_y2": 285.49, "r_x3": 343.731, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.234, "r_y0": 294.221, "r_x1": 436.601, "r_y1": 294.221, "r_x2": 436.601, "r_y2": 285.669, "r_x3": 417.234, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.092, "r_y0": 294.078, "r_x1": 516.561, "r_y1": 294.078, "r_x2": 516.561, "r_y2": 285.49, "r_x3": 439.092, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.561, "r_y0": 294.221, "r_x1": 519.052, "r_y1": 294.221, "r_x2": 519.052, "r_y2": 285.669, "r_x3": 516.561, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.914, "r_y0": 306.28, "r_x1": 545.114, "r_y1": 306.28, "r_x2": 545.114, "r_y2": 297.728, "r_x3": 403.914, "r_y3": 297.728, "coord_origin": "TOPLEFT"}, "text": "The transformer architecture of this", "orig": "The transformer architecture of this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.235, "r_x1": 517.529, "r_y1": 318.235, "r_x2": 517.529, "r_y2": 309.683, "r_x3": 308.862, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.094, "r_y0": 318.235, "r_x1": 545.115, "r_y1": 318.235, "r_x2": 545.115, "r_y2": 309.683, "r_x3": 524.094, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.19, "r_x1": 432.358, "r_y1": 330.19, "r_x2": 432.358, "r_y2": 321.638, "r_x3": 308.862, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.82, "r_y0": 330.047, "r_x1": 510.29, "r_y1": 330.047, "r_x2": 510.29, "r_y2": 321.459, "r_x3": 435.82, "r_y3": 321.459, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.978, "r_y0": 330.19, "r_x1": 520.623, "r_y1": 330.19, "r_x2": 520.623, "r_y2": 321.638, "r_x3": 513.978, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.08, "r_y0": 330.19, "r_x1": 545.111, "r_y1": 330.19, "r_x2": 545.111, "r_y2": 321.638, "r_x3": 524.08, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 342.145, "r_x1": 545.115, "r_y1": 342.145, "r_x2": 545.115, "r_y2": 333.593, "r_x3": 308.862, "r_y3": 333.593, "coord_origin": "TOPLEFT"}, "text": "eled as a transformer encoder with two encoder layers and", "orig": "eled as a transformer encoder with two encoder layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.1, "r_x1": 545.115, "r_y1": 354.1, "r_x2": 545.115, "r_y2": 345.548, "r_x3": 308.862, "r_y3": 345.548, "coord_origin": "TOPLEFT"}, "text": "a transformer decoder made from a stack of 4 decoder lay-", "orig": "a transformer decoder made from a stack of 4 decoder lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.056, "r_x1": 545.115, "r_y1": 366.056, "r_x2": 545.115, "r_y2": 357.504, "r_x3": 308.862, "r_y3": 357.504, "coord_origin": "TOPLEFT"}, "text": "ers that comprise mainly of multi-head attention and feed", "orig": "ers that comprise mainly of multi-head attention and feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.011, "r_x1": 370.391, "r_y1": 378.011, "r_x2": 370.391, "r_y2": 369.459, "r_x3": 308.862, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.445, "r_y0": 378.011, "r_x1": 545.115, "r_y1": 378.011, "r_x2": 545.115, "r_y2": 369.459, "r_x3": 377.445, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "This configuration uses fewer layers and", "orig": "This configuration uses fewer layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 389.966, "r_x1": 545.115, "r_y1": 389.966, "r_x2": 545.115, "r_y2": 381.414, "r_x3": 308.862, "r_y3": 381.414, "coord_origin": "TOPLEFT"}, "text": "heads in comparison to networks applied to other problems", "orig": "heads in comparison to networks applied to other problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 401.921, "r_x1": 326.566, "r_y1": 401.921, "r_x2": 326.566, "r_y2": 393.369, "r_x3": 308.862, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.069, "r_y0": 401.921, "r_x1": 545.115, "r_y1": 401.921, "r_x2": 545.115, "r_y2": 393.369, "r_x3": 331.069, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "'Scene Understanding', 'Image Captioning'), some-", "orig": "'Scene Understanding', 'Image Captioning'), some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 413.876, "r_x1": 528.019, "r_y1": 413.876, "r_x2": 528.019, "r_y2": 405.324, "r_x3": 308.862, "r_y3": 405.324, "coord_origin": "TOPLEFT"}, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.579, "r_y0": 425.935, "r_x1": 388.055, "r_y1": 425.935, "r_x2": 388.055, "r_y2": 417.383, "r_x3": 341.579, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.325, "r_y0": 425.935, "r_x1": 424.856, "r_y1": 425.935, "r_x2": 424.856, "r_y2": 417.383, "r_x3": 393.325, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoder", "orig": "encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.117, "r_y0": 425.935, "r_x1": 462.356, "r_y1": 425.935, "r_x2": 462.356, "r_y2": 417.383, "r_x3": 430.117, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "receives", "orig": "receives", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.626, "r_y0": 425.935, "r_x1": 477.031, "r_y1": 425.935, "r_x2": 477.031, "r_y2": 417.383, "r_x3": 467.626, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "an", "orig": "an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.301, "r_y0": 425.935, "r_x1": 515.496, "r_y1": 425.935, "r_x2": 515.496, "r_y2": 417.383, "r_x3": 482.301, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoded", "orig": "encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 520.766, "r_y0": 425.935, "r_x1": 545.115, "r_y1": 425.935, "r_x2": 545.115, "r_y2": 417.383, "r_x3": 520.766, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 437.89, "r_x1": 343.721, "r_y1": 437.89, "r_x2": 343.721, "r_y2": 429.338, "r_x3": 308.862, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.038, "r_y0": 437.747, "r_x1": 446.455, "r_y1": 437.747, "r_x2": 446.455, "r_y2": 429.159, "r_x3": 347.038, "r_y3": 429.159, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.94, "r_y0": 437.89, "r_x1": 545.113, "r_y1": 437.89, "r_x2": 545.113, "r_y2": 429.338, "r_x3": 449.94, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "and refines it through a", "orig": "and refines it through a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.845, "r_x1": 545.115, "r_y1": 449.845, "r_x2": 545.115, "r_y2": 441.293, "r_x3": 308.862, "r_y3": 441.293, "coord_origin": "TOPLEFT"}, "text": "multi-head dot-product attention layer, followed by a Feed", "orig": "multi-head dot-product attention layer, followed by a Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 461.8, "r_x1": 384.149, "r_y1": 461.8, "r_x2": 384.149, "r_y2": 453.248, "r_x3": 308.862, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.375, "r_y0": 461.8, "r_x1": 459.616, "r_y1": 461.8, "r_x2": 459.616, "r_y2": 453.248, "r_x3": 393.375, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "During training,", "orig": "During training,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.667, "r_y0": 461.8, "r_x1": 476.841, "r_y1": 461.8, "r_x2": 476.841, "r_y2": 453.248, "r_x3": 464.667, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 481.374, "r_y0": 461.8, "r_x1": 527.85, "r_y1": 461.8, "r_x2": 527.85, "r_y2": 453.248, "r_x3": 481.374, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.393, "r_y0": 461.8, "r_x1": 545.115, "r_y1": 461.8, "r_x2": 545.115, "r_y2": 453.248, "r_x3": 532.393, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.756, "r_x1": 545.115, "r_y1": 473.756, "r_x2": 545.115, "r_y2": 465.204, "r_x3": 308.862, "r_y3": 465.204, "coord_origin": "TOPLEFT"}, "text": "coder receives as input the output feature produced by the", "orig": "coder receives as input the output feature produced by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.711, "r_x1": 545.115, "r_y1": 485.711, "r_x2": 545.115, "r_y2": 477.159, "r_x3": 308.862, "r_y3": 477.159, "coord_origin": "TOPLEFT"}, "text": "transformer encoder, and the tokenized input of the HTML", "orig": "transformer encoder, and the tokenized input of the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.666, "r_x1": 545.115, "r_y1": 497.666, "r_x2": 545.115, "r_y2": 489.114, "r_x3": 308.862, "r_y3": 489.114, "coord_origin": "TOPLEFT"}, "text": "ground-truth tags. Using a stack of multi-head attention lay-", "orig": "ground-truth tags. Using a stack of multi-head attention lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.621, "r_x1": 545.115, "r_y1": 509.621, "r_x2": 545.115, "r_y2": 501.069, "r_x3": 308.862, "r_y3": 501.069, "coord_origin": "TOPLEFT"}, "text": "ers, different aspects of the tag sequence could be inferred.", "orig": "ers, different aspects of the tag sequence could be inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.576, "r_x1": 545.115, "r_y1": 521.576, "r_x2": 545.115, "r_y2": 513.024, "r_x3": 308.862, "r_y3": 513.024, "coord_origin": "TOPLEFT"}, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.5319999999999, "r_x1": 545.115, "r_y1": 533.5319999999999, "r_x2": 545.115, "r_y2": 524.98, "r_x3": 308.862, "r_y3": 524.98, "coord_origin": "TOPLEFT"}, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.487, "r_x1": 369.733, "r_y1": 545.487, "r_x2": 369.733, "r_y2": 536.935, "r_x3": 308.862, "r_y3": 536.935, "coord_origin": "TOPLEFT"}, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.341, "r_y0": 557.545, "r_x1": 545.115, "r_y1": 557.545, "r_x2": 545.115, "r_y2": 548.9929999999999, "r_x3": 410.341, "r_y3": 548.9929999999999, "coord_origin": "TOPLEFT"}, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.501, "r_x1": 545.115, "r_y1": 569.501, "r_x2": 545.115, "r_y2": 560.9490000000001, "r_x3": 308.862, "r_y3": 560.9490000000001, "coord_origin": "TOPLEFT"}, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.456, "r_x1": 545.115, "r_y1": 581.456, "r_x2": 545.115, "r_y2": 572.904, "r_x3": 308.862, "r_y3": 572.904, "coord_origin": "TOPLEFT"}, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4110000000001, "r_x1": 336.458, "r_y1": 593.4110000000001, "r_x2": 336.458, "r_y2": 584.859, "r_x3": 308.862, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "to end.", "orig": "to end.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.971, "r_y0": 593.4110000000001, "r_x1": 545.115, "r_y1": 593.4110000000001, "r_x2": 545.115, "r_y2": 584.859, "r_x3": 340.971, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "This approach is inspired by DETR [1] which em-", "orig": "This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.366, "r_x1": 545.115, "r_y1": 605.366, "r_x2": 545.115, "r_y2": 596.814, "r_x3": 308.862, "r_y3": 596.814, "coord_origin": "TOPLEFT"}, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.321, "r_x1": 545.115, "r_y1": 617.321, "r_x2": 545.115, "r_y2": 608.769, "r_x3": 308.862, "r_y3": 608.769, "coord_origin": "TOPLEFT"}, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.2760000000001, "r_x1": 545.115, "r_y1": 629.2760000000001, "r_x2": 545.115, "r_y2": 620.7239999999999, "r_x3": 308.862, "r_y3": 620.7239999999999, "coord_origin": "TOPLEFT"}, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.232, "r_x1": 381.679, "r_y1": 641.232, "r_x2": 381.679, "r_y2": 632.6800000000001, "r_x3": 308.862, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.997, "r_y0": 641.068, "r_x1": 391.746, "r_y1": 641.068, "r_x2": 391.746, "r_y2": 632.362, "r_x3": 383.997, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.746, "r_y0": 641.232, "r_x1": 399.497, "r_y1": 641.232, "r_x2": 399.497, "r_y2": 632.6800000000001, "r_x3": 391.746, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.497, "r_y0": 641.068, "r_x1": 407.246, "r_y1": 641.068, "r_x2": 407.246, "r_y2": 632.362, "r_x3": 399.497, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.246, "r_y0": 641.232, "r_x1": 432.91, "r_y1": 641.232, "r_x2": 432.91, "r_y2": 632.6800000000001, "r_x3": 407.246, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' and '", "orig": "' and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.908, "r_y0": 641.068, "r_x1": 440.657, "r_y1": 641.068, "r_x2": 440.657, "r_y2": 632.362, "r_x3": 432.908, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.657, "r_y0": 641.232, "r_x1": 545.115, "r_y1": 641.232, "r_x2": 545.115, "r_y2": 632.6800000000001, "r_x3": 440.657, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' HTML structure tags be-", "orig": "' HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.187, "r_x1": 398.964, "r_y1": 653.187, "r_x2": 398.964, "r_y2": 644.635, "r_x3": 308.862, "r_y3": 644.635, "coord_origin": "TOPLEFT"}, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.006, "r_y0": 665.103, "r_x1": 545.108, "r_y1": 665.103, "r_x2": 545.108, "r_y2": 656.515, "r_x3": 447.006, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 470.425, "r_y1": 713.066, "r_x2": 470.425, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "provide an attention weighted encoding.", "orig": "provide an attention weighted encoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.63, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 474.63, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "This weighted at-", "orig": "This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 204.37400000000002, "r": 86.884, "b": 212.92600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9677652716636658, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 249.803, "r": 545.115, "b": 258.355, "coord_origin": "TOPLEFT"}, "confidence": 0.9831458330154419, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 297.34, "r": 400.866, "b": 306.296, "coord_origin": "TOPLEFT"}, "confidence": 0.9862009882926941, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 417.383, "r": 336.309, "b": 425.935, "coord_origin": "TOPLEFT"}, "confidence": 0.9851906895637512, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "caption", "bbox": {"l": 50.112, "t": 528.171, "r": 85.878, "b": 536.723, "coord_origin": "TOPLEFT"}, "confidence": 0.8913407325744629, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 548.605, "r": 404.762, "b": 557.561, "coord_origin": "TOPLEFT"}, "confidence": 0.9869195818901062, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 656.694, "r": 444.343, "b": 665.246, "coord_origin": "TOPLEFT"}, "confidence": 0.9852352142333984, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8719564080238342, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "picture", "bbox": {"l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT"}, "confidence": 0.9296807646751404, "cells": [], "children": []}, {"id": 5, "label": "picture", "bbox": {"l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT"}, "confidence": 0.9724942445755005, "cells": [], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 6, "page_no": 4, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 204.37400000000002, "r": 86.884, "b": 212.92600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9677652716636658, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 3:"}, {"label": "text", "id": 4, "page_no": 4, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 249.803, "r": 545.115, "b": 258.355, "coord_origin": "TOPLEFT"}, "confidence": 0.9831458330154419, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "forming classification, and adding an adaptive pooling layer"}, {"label": "text", "id": 1, "page_no": 4, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 297.34, "r": 400.866, "b": 306.296, "coord_origin": "TOPLEFT"}, "confidence": 0.9862009882926941, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure Decoder."}, {"label": "text", "id": 3, "page_no": 4, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 417.383, "r": 336.309, "b": 425.935, "coord_origin": "TOPLEFT"}, "confidence": 0.9851906895637512, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The"}, {"label": "caption", "id": 8, "page_no": 4, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 50.112, "t": 528.171, "r": 85.878, "b": 536.723, "coord_origin": "TOPLEFT"}, "confidence": 0.8913407325744629, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 4:"}, {"label": "text", "id": 0, "page_no": 4, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 548.605, "r": 404.762, "b": 557.561, "coord_origin": "TOPLEFT"}, "confidence": 0.9869195818901062, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell BBox Decoder."}, {"label": "text", "id": 2, "page_no": 4, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 656.694, "r": 444.343, "b": 665.246, "coord_origin": "TOPLEFT"}, "confidence": 0.9852352142333984, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The encoding generated by the"}, {"label": "page_footer", "id": 9, "page_no": 4, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8719564080238342, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5"}, {"label": "picture", "id": 7, "page_no": 4, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT"}, "confidence": 0.9296807646751404, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 5, "page_no": 4, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT"}, "confidence": 0.9724942445755005, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 6, "page_no": 4, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 204.37400000000002, "r": 86.884, "b": 212.92600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9677652716636658, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 3:"}, {"label": "text", "id": 4, "page_no": 4, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 249.803, "r": 545.115, "b": 258.355, "coord_origin": "TOPLEFT"}, "confidence": 0.9831458330154419, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "forming classification, and adding an adaptive pooling layer"}, {"label": "text", "id": 1, "page_no": 4, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 297.34, "r": 400.866, "b": 306.296, "coord_origin": "TOPLEFT"}, "confidence": 0.9862009882926941, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure Decoder."}, {"label": "text", "id": 3, "page_no": 4, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 417.383, "r": 336.309, "b": 425.935, "coord_origin": "TOPLEFT"}, "confidence": 0.9851906895637512, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The"}, {"label": "caption", "id": 8, "page_no": 4, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 50.112, "t": 528.171, "r": 85.878, "b": 536.723, "coord_origin": "TOPLEFT"}, "confidence": 0.8913407325744629, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 4:"}, {"label": "text", "id": 0, "page_no": 4, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 548.605, "r": 404.762, "b": 557.561, "coord_origin": "TOPLEFT"}, "confidence": 0.9869195818901062, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell BBox Decoder."}, {"label": "text", "id": 2, "page_no": 4, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 656.694, "r": 444.343, "b": 665.246, "coord_origin": "TOPLEFT"}, "confidence": 0.9852352142333984, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The encoding generated by the"}, {"label": "picture", "id": 7, "page_no": 4, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT"}, "confidence": 0.9296807646751404, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 5, "page_no": 4, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT"}, "confidence": 0.9724942445755005, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 9, "page_no": 4, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8719564080238342, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5"}]}}, {"page_no": 5, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 286.365, "r_y1": 107.93899999999996, "r_x2": 286.365, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.894, "r_x1": 286.365, "r_y1": 119.894, "r_x2": 286.365, "r_y2": 111.34199999999998, "r_x3": 50.112, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.84900000000005, "r_x1": 135.691, "r_y1": 131.84900000000005, "r_x2": 135.691, "r_y2": 123.29700000000003, "r_x3": 50.112, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "of objects may exist.", "orig": "of objects may exist.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.047, "r_y0": 131.84900000000005, "r_x1": 286.365, "r_y1": 131.84900000000005, "r_x2": 286.365, "r_y2": 123.29700000000003, "r_x3": 142.047, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "In our case, we know up front that", "orig": "In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.80499999999995, "r_x1": 286.365, "r_y1": 143.80499999999995, "r_x2": 286.365, "r_y2": 135.25300000000004, "r_x3": 50.112, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.76, "r_x1": 175.163, "r_y1": 155.76, "r_x2": 175.163, "r_y2": 147.20799999999997, "r_x3": 50.112, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.275, "r_y0": 168.44500000000005, "r_x1": 144.806, "r_y1": 168.44500000000005, "r_x2": 144.806, "r_y2": 159.89300000000003, "r_x3": 113.275, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "features", "orig": "features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.937, "r_y0": 168.44500000000005, "r_x1": 161.554, "r_y1": 168.44500000000005, "r_x2": 161.554, "r_y2": 159.89300000000003, "r_x3": 149.937, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.684, "r_y0": 168.44500000000005, "r_x1": 184.936, "r_y1": 168.44500000000005, "r_x2": 184.936, "r_y2": 159.89300000000003, "r_x3": 166.684, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "each", "orig": "each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.057, "r_y0": 168.44500000000005, "r_x1": 209.424, "r_y1": 168.44500000000005, "r_x2": 209.424, "r_y2": 159.89300000000003, "r_x3": 190.057, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.555, "r_y0": 168.44500000000005, "r_x1": 228.941, "r_y1": 168.44500000000005, "r_x2": 228.941, "r_y2": 159.89300000000003, "r_x3": 214.555, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.061, "r_y0": 168.44500000000005, "r_x1": 246.226, "r_y1": 168.44500000000005, "r_x2": 246.226, "r_y2": 159.89300000000003, "r_x3": 234.061, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.356, "r_y0": 168.44500000000005, "r_x1": 268.512, "r_y1": 168.44500000000005, "r_x2": 268.512, "r_y2": 159.89300000000003, "r_x3": 251.356, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "then", "orig": "then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.643, "r_y0": 168.44500000000005, "r_x1": 286.365, "r_y1": 168.44500000000005, "r_x2": 286.365, "r_y2": 159.89300000000003, "r_x3": 273.643, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "fed", "orig": "fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.40099999999995, "r_x1": 65.614, "r_y1": 180.40099999999995, "r_x2": 65.614, "r_y2": 171.84900000000005, "r_x3": 50.112, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "into", "orig": "into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.107, "r_y0": 180.40099999999995, "r_x1": 82.281, "r_y1": 180.40099999999995, "r_x2": 82.281, "r_y2": 171.84900000000005, "r_x3": 70.107, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.764, "r_y0": 180.40099999999995, "r_x1": 138.66, "r_y1": 180.40099999999995, "r_x2": 138.66, "r_y2": 171.84900000000005, "r_x3": 86.764, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "feed-forward", "orig": "feed-forward", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.153, "r_y0": 180.40099999999995, "r_x1": 286.365, "r_y1": 180.40099999999995, "r_x2": 286.365, "r_y2": 171.84900000000005, "r_x3": 143.153, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "network (FFN). The FFN consists", "orig": "network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.356, "r_x1": 286.365, "r_y1": 192.356, "r_x2": 286.365, "r_y2": 183.80399999999997, "r_x3": 50.112, "r_y3": 183.80399999999997, "coord_origin": "TOPLEFT"}, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.31100000000004, "r_x1": 286.365, "r_y1": 204.31100000000004, "r_x2": 286.365, "r_y2": 195.75900000000001, "r_x3": 50.112, "r_y3": 195.75900000000001, "coord_origin": "TOPLEFT"}, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 216.26599999999996, "r_x1": 196.004, "r_y1": 216.26599999999996, "r_x2": 196.004, "r_y2": 207.71400000000006, "r_x3": 50.112, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table cell.", "orig": "the bounding box of each table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.786, "r_y0": 216.26599999999996, "r_x1": 286.365, "r_y1": 216.26599999999996, "r_x2": 286.365, "r_y2": 207.71400000000006, "r_x3": 200.786, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "Finally, the predicted", "orig": "Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 228.221, "r_x1": 286.365, "r_y1": 228.221, "r_x2": 286.365, "r_y2": 219.66899999999998, "r_x3": 50.112, "r_y3": 219.66899999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 240.17700000000002, "r_x1": 181.549, "r_y1": 240.17700000000002, "r_x2": 181.549, "r_y2": 231.625, "r_x3": 50.112, "r_y3": 231.625, "coord_origin": "TOPLEFT"}, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.451, "r_y0": 252.86199999999997, "r_x1": 276.139, "r_y1": 252.86199999999997, "r_x2": 276.139, "r_y2": 244.30999999999995, "r_x3": 134.451, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "We formulate a multi-task loss Eq.", "orig": "We formulate a multi-task loss Eq.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.379, "r_y0": 252.86199999999997, "r_x1": 286.361, "r_y1": 252.86199999999997, "r_x2": 286.361, "r_y2": 244.30999999999995, "r_x3": 281.379, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.817, "r_x1": 134.685, "r_y1": 264.817, "r_x2": 134.685, "r_y2": 256.265, "r_x3": 50.112, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "to train our network.", "orig": "to train our network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.543, "r_y0": 264.817, "r_x1": 286.365, "r_y1": 264.817, "r_x2": 286.365, "r_y2": 256.265, "r_x3": 140.543, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "The Cross-Entropy loss (denoted as", "orig": "The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.60900000000004, "r_x1": 53.085, "r_y1": 276.60900000000004, "r_x2": 53.085, "r_y2": 267.903, "r_x3": 50.112, "r_y3": 267.903, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.085, "r_y0": 277.53200000000004, "r_x1": 56.845, "r_y1": 277.53200000000004, "r_x2": 56.845, "r_y2": 271.438, "r_x3": 53.085, "r_y3": 271.438, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 57.343, "r_y0": 276.773, "r_x1": 135.4, "r_y1": 276.773, "r_x2": 135.4, "r_y2": 268.221, "r_x3": 57.343, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.735, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04200000000003, "r_x3": 137.735, "r_y3": 268.04200000000003, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.637, "r_y0": 276.773, "r_x1": 286.364, "r_y1": 276.773, "r_x2": 286.364, "r_y2": 268.221, "r_x3": 213.637, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.728, "r_x1": 158.824, "r_y1": 288.728, "r_x2": 158.824, "r_y2": 280.176, "r_x3": 50.112, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.318, "r_y0": 288.585, "r_x1": 238.797, "r_y1": 288.585, "r_x2": 238.797, "r_y2": 279.99699999999996, "r_x3": 161.318, "r_y3": 279.99699999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.521, "r_y0": 288.728, "r_x1": 286.363, "r_y1": 288.728, "r_x2": 286.363, "r_y2": 280.176, "r_x3": 241.521, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.683, "r_x1": 211.377, "r_y1": 300.683, "r_x2": 211.377, "r_y2": 292.131, "r_x3": 50.112, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.271, "r_y0": 300.519, "r_x1": 217.244, "r_y1": 300.519, "r_x2": 217.244, "r_y2": 291.813, "r_x3": 214.271, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.244, "r_y0": 301.442, "r_x1": 229.198, "r_y1": 301.442, "r_x2": 229.198, "r_y2": 295.348, "r_x3": 217.244, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.696, "r_y0": 300.683, "r_x1": 232.187, "r_y1": 300.683, "r_x2": 232.187, "r_y2": 292.131, "r_x3": 229.696, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.49, "r_y0": 300.519, "r_x1": 239.463, "r_y1": 300.519, "r_x2": 239.463, "r_y2": 291.813, "r_x3": 236.49, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.463, "r_y0": 301.442, "r_x1": 251.417, "r_y1": 301.442, "r_x2": 251.417, "r_y2": 295.348, "r_x3": 239.463, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.811, "r_y0": 300.683, "r_x1": 286.363, "r_y1": 300.683, "r_x2": 286.363, "r_y2": 292.131, "r_x3": 254.811, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.638, "r_x1": 137.454, "r_y1": 312.638, "r_x2": 137.454, "r_y2": 304.086, "r_x3": 50.112, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.298, "r_y0": 312.474, "r_x1": 144.271, "r_y1": 312.474, "r_x2": 144.271, "r_y2": 303.768, "r_x3": 141.298, "r_y3": 303.768, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.271, "r_y0": 313.398, "r_x1": 148.243, "r_y1": 313.398, "r_x2": 148.243, "r_y2": 307.304, "r_x3": 144.271, "r_y3": 307.304, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.586, "r_y0": 312.638, "r_x1": 286.364, "r_y1": 312.638, "r_x2": 286.364, "r_y2": 304.086, "r_x3": 152.586, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.593, "r_x1": 89.683, "r_y1": 324.593, "r_x2": 89.683, "r_y2": 316.041, "r_x3": 50.112, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.686, "r_y0": 324.429, "r_x1": 92.659, "r_y1": 324.429, "r_x2": 92.659, "r_y2": 315.723, "r_x3": 89.686, "r_y3": 315.723, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.659, "r_y0": 325.353, "r_x1": 104.12, "r_y1": 325.353, "r_x2": 104.12, "r_y2": 319.259, "r_x3": 92.659, "r_y3": 319.259, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.618, "r_y0": 324.593, "r_x1": 286.366, "r_y1": 324.593, "r_x2": 286.366, "r_y2": 316.041, "r_x3": 104.618, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.549, "r_x1": 286.365, "r_y1": 336.549, "r_x2": 286.365, "r_y2": 327.997, "r_x3": 50.112, "r_y3": 327.997, "coord_origin": "TOPLEFT"}, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.504, "r_x1": 286.365, "r_y1": 348.504, "r_x2": 286.365, "r_y2": 339.952, "r_x3": 50.112, "r_y3": 339.952, "coord_origin": "TOPLEFT"}, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.459, "r_x1": 286.365, "r_y1": 360.459, "r_x2": 286.365, "r_y2": 351.907, "r_x3": 50.112, "r_y3": 351.907, "coord_origin": "TOPLEFT"}, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.414, "r_x1": 286.365, "r_y1": 372.414, "r_x2": 286.365, "r_y2": 363.862, "r_x3": 50.112, "r_y3": 363.862, "coord_origin": "TOPLEFT"}, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.369, "r_x1": 286.365, "r_y1": 384.369, "r_x2": 286.365, "r_y2": 375.817, "r_x3": 50.112, "r_y3": 375.817, "coord_origin": "TOPLEFT"}, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.324, "r_x1": 286.365, "r_y1": 396.324, "r_x2": 286.365, "r_y2": 387.772, "r_x3": 50.112, "r_y3": 387.772, "coord_origin": "TOPLEFT"}, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.28, "r_x1": 88.687, "r_y1": 408.28, "r_x2": 88.687, "r_y2": 399.728, "r_x3": 50.112, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.646, "r_y0": 408.137, "r_x1": 170.052, "r_y1": 408.137, "r_x2": 170.052, "r_y2": 399.549, "r_x3": 91.646, "r_y3": 399.549, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.051, "r_y0": 408.28, "r_x1": 172.542, "r_y1": 408.28, "r_x2": 172.542, "r_y2": 399.728, "r_x3": 170.051, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.62, "r_y0": 408.28, "r_x1": 286.364, "r_y1": 408.28, "r_x2": 286.364, "r_y2": 399.728, "r_x3": 175.62, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "and 2) Our bounding boxes", "orig": "and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.235, "r_x1": 181.967, "r_y1": 420.235, "r_x2": 181.967, "r_y2": 411.683, "r_x3": 50.112, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.09, "r_y0": 420.235, "r_x1": 286.365, "r_y1": 420.235, "r_x2": 286.365, "r_y2": 411.683, "r_x3": 189.09, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "3) ensures a one-to-one", "orig": "3) ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.19, "r_x1": 286.365, "r_y1": 432.19, "r_x2": 286.365, "r_y2": 423.638, "r_x3": 50.112, "r_y3": 423.638, "coord_origin": "TOPLEFT"}, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.145, "r_x1": 158.296, "r_y1": 444.145, "r_x2": 158.296, "r_y2": 435.593, "r_x3": 50.112, "r_y3": 435.593, "coord_origin": "TOPLEFT"}, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 468.786, "r_x1": 91.377, "r_y1": 468.786, "r_x2": 91.377, "r_y2": 460.234, "r_x3": 50.112, "r_y3": 460.234, "coord_origin": "TOPLEFT"}, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.688, "r_y0": 503.02, "r_x1": 140.642, "r_y1": 503.02, "r_x2": 140.642, "r_y2": 496.926, "r_x3": 128.688, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.907, "r_y0": 502.097, "r_x1": 151.656, "r_y1": 502.097, "r_x2": 151.656, "r_y2": 493.391, "r_x3": 143.907, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.423, "r_y0": 502.097, "r_x1": 160.234, "r_y1": 502.097, "r_x2": 160.234, "r_y2": 493.391, "r_x3": 154.423, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.235, "r_y0": 503.02, "r_x1": 186.628, "r_y1": 503.02, "r_x2": 186.628, "r_y2": 496.926, "r_x3": 160.235, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "iou iou", "orig": "iou iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.194, "r_y0": 502.097, "r_x1": 175.167, "r_y1": 502.097, "r_x2": 175.167, "r_y2": 493.391, "r_x3": 172.194, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.34, "r_y0": 502.097, "r_x1": 197.089, "r_y1": 502.097, "r_x2": 197.089, "r_y2": 493.391, "r_x3": 189.34, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.303, "r_y0": 502.097, "r_x1": 205.114, "r_y1": 502.097, "r_x2": 205.114, "r_y2": 493.391, "r_x3": 199.303, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.115, "r_y0": 503.02, "r_x1": 207.635, "r_y1": 503.02, "r_x2": 207.635, "r_y2": 496.926, "r_x3": 205.115, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.675, "r_y0": 503.02, "r_x1": 211.647, "r_y1": 503.02, "r_x2": 211.647, "r_y2": 496.926, "r_x3": 207.675, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.33, "r_y0": 517.0409999999999, "r_x1": 127.303, "r_y1": 517.0409999999999, "r_x2": 127.303, "r_y2": 508.335, "r_x3": 124.33, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.266, "r_y0": 517.0409999999999, "r_x1": 138.015, "r_y1": 517.0409999999999, "r_x2": 138.015, "r_y2": 508.335, "r_x3": 130.266, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.782, "r_y0": 517.0409999999999, "r_x1": 149.566, "r_y1": 517.0409999999999, "r_x2": 149.566, "r_y2": 508.335, "r_x3": 140.782, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bbl", "orig": "\u03bbl", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.566, "r_y0": 517.9639999999999, "r_x1": 153.326, "r_y1": 517.9639999999999, "r_x2": 153.326, "r_y2": 511.87, "r_x3": 149.566, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.039, "r_y0": 517.0409999999999, "r_x1": 174.855, "r_y1": 517.0409999999999, "r_x2": 174.855, "r_y2": 508.335, "r_x3": 156.039, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "+(1", "orig": "+(1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.071, "r_y0": 516.899, "r_x1": 184.82, "r_y1": 516.899, "r_x2": 184.82, "r_y2": 508.335, "r_x3": 177.071, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.033, "r_y0": 517.0409999999999, "r_x1": 199.692, "r_y1": 517.0409999999999, "r_x2": 199.692, "r_y2": 508.335, "r_x3": 187.033, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bb l", "orig": "\u03bb l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.845, "r_y0": 517.0409999999999, "r_x1": 196.719, "r_y1": 517.0409999999999, "r_x2": 196.719, "r_y2": 508.335, "r_x3": 192.845, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.692, "r_y0": 517.9639999999999, "r_x1": 211.646, "r_y1": 517.9639999999999, "r_x2": 211.646, "r_y2": 511.87, "r_x3": 199.692, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 509.832, "r_x1": 286.362, "r_y1": 509.832, "r_x2": 286.362, "r_y2": 501.28, "r_x3": 274.746, "r_y3": 501.28, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.941, "r_y0": 539.966, "r_x1": 82.752, "r_y1": 539.966, "r_x2": 82.752, "r_y2": 531.26, "r_x3": 76.941, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.52, "r_y0": 539.8240000000001, "r_x1": 92.162, "r_y1": 539.8240000000001, "r_x2": 92.162, "r_y2": 531.26, "r_x3": 85.52, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.653, "r_y0": 540.13, "r_x1": 135.599, "r_y1": 540.13, "r_x2": 135.599, "r_y2": 531.578, "r_x3": 94.653, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.09, "r_y0": 539.966, "r_x1": 143.901, "r_y1": 539.966, "r_x2": 143.901, "r_y2": 531.26, "r_x3": 138.09, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.901, "r_y0": 540.889, "r_x1": 155.362, "r_y1": 540.889, "r_x2": 155.362, "r_y2": 534.7950000000001, "r_x3": 143.901, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 539.966, "r_x1": 166.104, "r_y1": 539.966, "r_x2": 166.104, "r_y2": 531.26, "r_x3": 155.861, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": ", \u03bb", "orig": ", \u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.1, "r_y0": 540.889, "r_x1": 168.62, "r_y1": 540.889, "r_x2": 168.62, "r_y2": 534.7950000000001, "r_x3": 166.1, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.66, "r_y0": 540.889, "r_x1": 172.632, "r_y1": 540.889, "r_x2": 172.632, "r_y2": 534.7950000000001, "r_x3": 168.66, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.897, "r_y0": 539.8240000000001, "r_x1": 182.539, "r_y1": 539.8240000000001, "r_x2": 182.539, "r_y2": 531.26, "r_x3": 175.897, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.306, "r_y0": 538.064, "r_x1": 192.501, "r_y1": 538.064, "r_x2": 192.501, "r_y2": 533.441, "r_x3": 185.306, "r_y3": 533.441, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.992, "r_y0": 540.13, "r_x1": 281.597, "r_y1": 540.13, "r_x2": 281.597, "r_y2": 531.578, "r_x3": 194.992, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.384, "r_y0": 604.412, "r_x1": 286.36, "r_y1": 604.412, "r_x2": 286.36, "r_y2": 595.8240000000001, "r_x3": 205.384, "r_y3": 595.8240000000001, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 616.367, "r_x1": 70.037, "r_y1": 616.367, "r_x2": 70.037, "r_y2": 607.779, "r_x3": 50.112, "r_y3": 607.779, "coord_origin": "TOPLEFT"}, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 616.51, "r_x1": 72.528, "r_y1": 616.51, "r_x2": 72.528, "r_y2": 607.958, "r_x3": 70.037, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.14, "r_y0": 616.51, "r_x1": 286.365, "r_y1": 616.51, "r_x2": 286.365, "r_y2": 607.958, "r_x3": 77.14, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": "The input images are resized to 448*448 pixels and", "orig": "The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 628.465, "r_x1": 286.365, "r_y1": 628.465, "r_x2": 286.365, "r_y2": 619.913, "r_x3": 50.112, "r_y3": 619.913, "coord_origin": "TOPLEFT"}, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 640.421, "r_x1": 207.033, "r_y1": 640.421, "r_x2": 207.033, "r_y2": 631.869, "r_x3": 50.112, "r_y3": 631.869, "coord_origin": "TOPLEFT"}, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.507, "r_y0": 663.06, "r_x1": 196.256, "r_y1": 663.06, "r_x2": 196.256, "r_y2": 654.496, "r_x3": 188.507, "r_y3": 654.496, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.746, "r_y0": 663.366, "r_x1": 244.813, "r_y1": 663.366, "r_x2": 244.813, "r_y2": 654.814, "r_x3": 198.746, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.016, "r_y0": 678.31, "r_x1": 186.246, "r_y1": 678.31, "r_x2": 186.246, "r_y2": 669.758, "r_x3": 101.016, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.736, "r_y0": 678.004, "r_x1": 196.485, "r_y1": 678.004, "r_x2": 196.485, "r_y2": 669.44, "r_x3": 188.736, "r_y3": 669.44, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.975, "r_y0": 678.31, "r_x1": 244.813, "r_y1": 678.31, "r_x2": 244.813, "r_y2": 669.758, "r_x3": 198.975, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 670.938, "r_x1": 286.362, "r_y1": 670.938, "r_x2": 286.362, "r_y2": 662.386, "r_x3": 274.746, "r_y3": 662.386, "coord_origin": "TOPLEFT"}, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 339.985, "r_y1": 95.98400000000004, "r_x2": 339.985, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.889, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 346.889, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 492.961, "r_y1": 107.93899999999996, "r_x2": 492.961, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 137.005, "r_x1": 545.115, "r_y1": 137.005, "r_x2": 545.115, "r_y2": 128.45299999999997, "r_x3": 308.862, "r_y3": 128.45299999999997, "coord_origin": "TOPLEFT"}, "text": "Encoder Layers', with an input feature size of 512, feed", "orig": "Encoder Layers', with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 148.96000000000004, "r_x1": 545.115, "r_y1": 148.96000000000004, "r_x2": 545.115, "r_y2": 140.40800000000002, "r_x3": 308.862, "r_y3": 140.40800000000002, "coord_origin": "TOPLEFT"}, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 160.91499999999996, "r_x1": 545.115, "r_y1": 160.91499999999996, "r_x2": 545.115, "r_y2": 152.36300000000006, "r_x3": 308.862, "r_y3": 152.36300000000006, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder it is composed of four 'Transformer", "orig": "Transformer Decoder it is composed of four 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 172.87, "r_x1": 545.115, "r_y1": 172.87, "r_x2": 545.115, "r_y2": 164.31799999999998, "r_x3": 308.862, "r_y3": 164.31799999999998, "coord_origin": "TOPLEFT"}, "text": "Decoder Layers' with similar input and output dimensions", "orig": "Decoder Layers' with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 184.82600000000002, "r_x1": 317.161, "r_y1": 184.82600000000002, "r_x2": 317.161, "r_y2": 176.274, "r_x3": 308.862, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.365, "r_y0": 184.82600000000002, "r_x1": 333.539, "r_y1": 184.82600000000002, "r_x2": 333.539, "r_y2": 176.274, "r_x3": 321.365, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.734, "r_y0": 184.82600000000002, "r_x1": 467.218, "r_y1": 184.82600000000002, "r_x2": 467.218, "r_y2": 176.274, "r_x3": 337.734, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "'Transformer Encoder Layers'.", "orig": "'Transformer Encoder Layers'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.437, "r_y0": 184.82600000000002, "r_x1": 545.115, "r_y1": 184.82600000000002, "r_x2": 545.115, "r_y2": 176.274, "r_x3": 475.437, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 196.78099999999995, "r_x1": 545.115, "r_y1": 196.78099999999995, "r_x2": 545.115, "r_y2": 188.22900000000004, "r_x3": 308.862, "r_y3": 188.22900000000004, "coord_origin": "TOPLEFT"}, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 208.736, "r_x1": 399.213, "r_y1": 208.736, "r_x2": 399.213, "r_y2": 200.18399999999997, "r_x3": 308.862, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "mentation parameters,", "orig": "mentation parameters,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.965, "r_y0": 208.736, "r_x1": 458.63, "r_y1": 208.736, "r_x2": 458.63, "r_y2": 200.18399999999997, "r_x3": 403.965, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "our extensive", "orig": "our extensive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 462.934, "r_y0": 208.736, "r_x1": 545.115, "r_y1": 208.736, "r_x2": 545.115, "r_y2": 200.18399999999997, "r_x3": 462.934, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "experimentation has", "orig": "experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 220.69100000000003, "r_x1": 527.84, "r_y1": 220.69100000000003, "r_x2": 527.84, "r_y2": 212.139, "r_x3": 308.862, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "proved this setup to be more suitable for table images.", "orig": "proved this setup to be more suitable for table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.084, "r_y0": 220.69100000000003, "r_x1": 545.115, "r_y1": 220.69100000000003, "r_x2": 545.115, "r_y2": 212.139, "r_x3": 532.084, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "We", "orig": "We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.64599999999996, "r_x1": 341.868, "r_y1": 232.64599999999996, "r_x2": 341.868, "r_y2": 224.09400000000005, "r_x3": 308.862, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "attribute", "orig": "attribute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 232.64599999999996, "r_x1": 360.767, "r_y1": 232.64599999999996, "r_x2": 360.767, "r_y2": 224.09400000000005, "r_x3": 346.371, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.27, "r_y0": 232.64599999999996, "r_x1": 393.504, "r_y1": 232.64599999999996, "r_x2": 393.504, "r_y2": 224.09400000000005, "r_x3": 365.27, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.007, "r_y0": 232.64599999999996, "r_x1": 405.758, "r_y1": 232.64599999999996, "r_x2": 405.758, "r_y2": 224.09400000000005, "r_x3": 398.007, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.261, "r_y0": 232.64599999999996, "r_x1": 422.436, "r_y1": 232.64599999999996, "r_x2": 422.436, "r_y2": 224.09400000000005, "r_x3": 410.261, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 232.64599999999996, "r_x1": 459.586, "r_y1": 232.64599999999996, "r_x2": 459.586, "r_y2": 224.09400000000005, "r_x3": 426.939, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "inherent", "orig": "inherent", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.089, "r_y0": 232.64599999999996, "r_x1": 490.102, "r_y1": 232.64599999999996, "r_x2": 490.102, "r_y2": 224.09400000000005, "r_x3": 464.089, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "design", "orig": "design", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.605, "r_y0": 232.64599999999996, "r_x1": 502.904, "r_y1": 232.64599999999996, "r_x2": 502.904, "r_y2": 224.09400000000005, "r_x3": 494.605, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 507.407, "r_y0": 232.64599999999996, "r_x1": 526.774, "r_y1": 232.64599999999996, "r_x2": 526.774, "r_y2": 224.09400000000005, "r_x3": 507.407, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.277, "r_y0": 232.64599999999996, "r_x1": 545.115, "r_y1": 232.64599999999996, "r_x2": 545.115, "r_y2": 224.09400000000005, "r_x3": 531.277, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "im-", "orig": "im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 244.601, "r_x1": 545.115, "r_y1": 244.601, "r_x2": 545.115, "r_y2": 236.04899999999998, "r_x3": 308.862, "r_y3": 236.04899999999998, "coord_origin": "TOPLEFT"}, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.557, "r_x1": 496.169, "r_y1": 256.557, "r_x2": 496.169, "r_y2": 248.005, "r_x3": 308.862, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "elaborate content present in other scopes (e.g.", "orig": "elaborate content present in other scopes (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.897, "r_y0": 256.557, "r_x1": 545.115, "r_y1": 256.557, "r_x2": 545.115, "r_y2": 248.005, "r_x3": 501.897, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "the COCO", "orig": "the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.51199999999994, "r_x1": 342.336, "r_y1": 268.51199999999994, "r_x2": 342.336, "r_y2": 259.96000000000004, "r_x3": 308.862, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.952, "r_y0": 268.51199999999994, "r_x1": 545.115, "r_y1": 268.51199999999994, "r_x2": 545.115, "r_y2": 259.96000000000004, "r_x3": 348.952, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.467, "r_x1": 545.115, "r_y1": 280.467, "r_x2": 545.115, "r_y2": 271.91499999999996, "r_x3": 308.862, "r_y3": 271.91499999999996, "coord_origin": "TOPLEFT"}, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.422, "r_x1": 545.115, "r_y1": 292.422, "r_x2": 545.115, "r_y2": 283.87, "r_x3": 308.862, "r_y3": 283.87, "coord_origin": "TOPLEFT"}, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.377, "r_x1": 545.115, "r_y1": 304.377, "r_x2": 545.115, "r_y2": 295.825, "r_x3": 308.862, "r_y3": 295.825, "coord_origin": "TOPLEFT"}, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.332, "r_x1": 545.115, "r_y1": 316.332, "r_x2": 545.115, "r_y2": 307.78, "r_x3": 308.862, "r_y3": 307.78, "coord_origin": "TOPLEFT"}, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.288, "r_x1": 532.483, "r_y1": 328.288, "r_x2": 532.483, "r_y2": 319.736, "r_x3": 308.862, "r_y3": 319.736, "coord_origin": "TOPLEFT"}, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 357.353, "r_x1": 403.736, "r_y1": 357.353, "r_x2": 403.736, "r_y2": 348.801, "r_x3": 308.862, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.076, "r_y0": 357.21, "r_x1": 545.112, "r_y1": 357.21, "r_x2": 545.112, "r_y2": 348.622, "r_x3": 406.076, "r_y3": 348.622, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network Structure", "orig": "CNN Backbone Network Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 503.539, "r_y0": 357.353, "r_x1": 506.03, "r_y1": 357.353, "r_x2": 506.03, "r_y2": 348.801, "r_x3": 503.539, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 369.165, "r_x1": 343.163, "r_y1": 369.165, "r_x2": 343.163, "r_y2": 360.577, "r_x3": 308.862, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.163, "r_y0": 369.308, "r_x1": 362.202, "r_y1": 369.308, "r_x2": 362.202, "r_y2": 360.756, "r_x3": 343.163, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.286, "r_y0": 369.165, "r_x1": 440.938, "r_y1": 369.165, "r_x2": 440.938, "r_y2": 360.577, "r_x3": 364.286, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.939, "r_y0": 369.308, "r_x1": 443.43, "r_y1": 369.308, "r_x2": 443.43, "r_y2": 360.756, "r_x3": 440.939, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.379, "r_y0": 369.308, "r_x1": 545.108, "r_y1": 369.308, "r_x2": 545.108, "r_y2": 360.756, "r_x3": 446.379, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": "Taking the PubTabNet as", "orig": "Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 381.263, "r_x1": 545.115, "r_y1": 381.263, "r_x2": 545.115, "r_y2": 372.711, "r_x3": 308.862, "r_y3": 372.711, "coord_origin": "TOPLEFT"}, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 393.219, "r_x1": 545.115, "r_y1": 393.219, "r_x2": 545.115, "r_y2": 384.667, "r_x3": 308.862, "r_y3": 384.667, "coord_origin": "TOPLEFT"}, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 405.01, "r_x1": 314.673, "r_y1": 405.01, "r_x2": 314.673, "r_y2": 396.304, "r_x3": 308.862, "r_y3": 396.304, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.658, "r_y0": 405.174, "r_x1": 329.726, "r_y1": 405.174, "r_x2": 329.726, "r_y2": 396.622, "r_x3": 318.658, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.711, "r_y0": 405.174, "r_x1": 341.462, "r_y1": 405.174, "r_x2": 341.462, "r_y2": 396.622, "r_x3": 333.711, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.447, "r_y0": 405.174, "r_x1": 360.391, "r_y1": 405.174, "r_x2": 360.391, "r_y2": 396.622, "r_x3": 345.447, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "0.5.", "orig": "0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.963, "r_y0": 405.174, "r_x1": 415.166, "r_y1": 405.174, "r_x2": 415.166, "r_y2": 396.622, "r_x3": 367.963, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "Afterwards,", "orig": "Afterwards,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 419.519, "r_y0": 405.174, "r_x1": 545.108, "r_y1": 405.174, "r_x2": 545.108, "r_y2": 396.622, "r_x3": 419.519, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "we reduce the learning rate to", "orig": "we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 417.129, "r_x1": 545.115, "r_y1": 417.129, "r_x2": 545.115, "r_y2": 408.577, "r_x3": 308.862, "r_y3": 408.577, "coord_origin": "TOPLEFT"}, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 429.084, "r_x1": 360.966, "r_y1": 429.084, "r_x2": 360.966, "r_y2": 420.532, "r_x3": 308.862, "r_y3": 420.532, "coord_origin": "TOPLEFT"}, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 458.15, "r_x1": 384.628, "r_y1": 458.15, "r_x2": 384.628, "r_y2": 449.598, "r_x3": 308.862, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.372, "r_y0": 458.15, "r_x1": 545.115, "r_y1": 458.15, "r_x2": 545.115, "r_y2": 449.598, "r_x3": 391.372, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 470.105, "r_x1": 494.007, "r_y1": 470.105, "r_x2": 494.007, "r_y2": 461.553, "r_x3": 308.862, "r_y3": 461.553, "coord_origin": "TOPLEFT"}, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.078, "r_y0": 469.962, "r_x1": 545.111, "r_y1": 469.962, "r_x2": 545.111, "r_y2": 461.374, "r_x3": 498.078, "r_y3": 461.374, "coord_origin": "TOPLEFT"}, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 481.917, "r_x1": 364.443, "r_y1": 481.917, "r_x2": 364.443, "r_y2": 473.329, "r_x3": 308.862, "r_y3": 473.329, "coord_origin": "TOPLEFT"}, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.061, "r_y0": 482.06, "r_x1": 545.113, "r_y1": 482.06, "r_x2": 545.113, "r_y2": 473.508, "r_x3": 367.061, "r_y3": 473.508, "coord_origin": "TOPLEFT"}, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 494.015, "r_x1": 545.115, "r_y1": 494.015, "r_x2": 545.115, "r_y2": 485.463, "r_x3": 308.862, "r_y3": 485.463, "coord_origin": "TOPLEFT"}, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 505.97, "r_x1": 545.115, "r_y1": 505.97, "r_x2": 545.115, "r_y2": 497.418, "r_x3": 308.862, "r_y3": 497.418, "coord_origin": "TOPLEFT"}, "text": "step. Similarly, we employ a 'caching' technique to preform", "orig": "step. Similarly, we employ a 'caching' technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 517.9259999999999, "r_x1": 432.588, "r_y1": 517.9259999999999, "r_x2": 432.588, "r_y2": 509.374, "r_x3": 308.862, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "faster autoregressive decoding.", "orig": "faster autoregressive decoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 517.9259999999999, "r_x1": 545.115, "r_y1": 517.9259999999999, "r_x2": 545.115, "r_y2": 509.374, "r_x3": 436.732, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "This is achieved by storing", "orig": "This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 529.881, "r_x1": 545.115, "r_y1": 529.881, "r_x2": 545.115, "r_y2": 521.329, "r_x3": 308.862, "r_y3": 521.329, "coord_origin": "TOPLEFT"}, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 541.836, "r_x1": 370.062, "r_y1": 541.836, "r_x2": 370.062, "r_y2": 533.284, "r_x3": 308.862, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "each time step.", "orig": "each time step.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.721, "r_y0": 541.836, "r_x1": 545.115, "r_y1": 541.836, "r_x2": 545.115, "r_y2": 533.284, "r_x3": 375.721, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "Therefore, we only compute the attention", "orig": "Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 553.7909999999999, "r_x1": 377.215, "r_y1": 553.7909999999999, "r_x2": 377.215, "r_y2": 545.239, "r_x3": 308.862, "r_y3": 545.239, "coord_origin": "TOPLEFT"}, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 624.225, "r_x1": 545.115, "r_y1": 624.225, "r_x2": 545.115, "r_y2": 615.673, "r_x3": 308.862, "r_y3": 615.673, "coord_origin": "TOPLEFT"}, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 636.1800000000001, "r_x1": 545.115, "r_y1": 636.1800000000001, "r_x2": 545.115, "r_y2": 627.6279999999999, "r_x3": 308.862, "r_y3": 627.6279999999999, "coord_origin": "TOPLEFT"}, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 648.135, "r_x1": 545.115, "r_y1": 648.135, "r_x2": 545.115, "r_y2": 639.583, "r_x3": 308.862, "r_y3": 639.583, "coord_origin": "TOPLEFT"}, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 660.091, "r_x1": 545.115, "r_y1": 660.091, "r_x2": 545.115, "r_y2": 651.539, "r_x3": 308.862, "r_y3": 651.539, "coord_origin": "TOPLEFT"}, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 672.046, "r_x1": 350.705, "r_y1": 672.046, "r_x2": 350.705, "r_y2": 663.494, "r_x3": 308.862, "r_y3": 663.494, "coord_origin": "TOPLEFT"}, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 361.196, "r_y1": 701.111, "r_x2": 361.196, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.057, "r_y0": 701.111, "r_x1": 396.214, "r_y1": 701.111, "r_x2": 396.214, "r_y2": 692.559, "r_x3": 366.057, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.406, "r_y0": 701.111, "r_x1": 453.449, "r_y1": 701.111, "r_x2": 453.449, "r_y2": 692.559, "r_x3": 406.406, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Throughout", "orig": "Throughout", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.311, "r_y0": 701.111, "r_x1": 471.591, "r_y1": 701.111, "r_x2": 471.591, "r_y2": 692.559, "r_x3": 458.311, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.453, "r_y0": 701.111, "r_x1": 527.481, "r_y1": 701.111, "r_x2": 527.481, "r_y2": 692.559, "r_x3": 476.453, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "experiments,", "orig": "experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.941, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 532.941, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.067, "r_x1": 495.94, "r_y1": 713.067, "r_x2": 495.94, "r_y2": 704.515, "r_x3": 308.862, "r_y3": 704.515, "coord_origin": "TOPLEFT"}, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9868090152740479, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9799237847328186, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 116.49800000000005, "r": 545.115, "b": 125.04999999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9880930781364441, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "text", "bbox": {"l": 62.067, "t": 159.89300000000003, "r": 108.154, "b": 168.44500000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9860327839851379, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 243.92200000000003, "r": 129.215, "b": 252.87800000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9873637557029724, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 336.846, "r": 545.115, "b": 345.398, "coord_origin": "TOPLEFT"}, "confidence": 0.9877589344978333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 437.643, "r": 545.115, "b": 446.195, "coord_origin": "TOPLEFT"}, "confidence": 0.9884491562843323, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 448.279, "r": 286.365, "b": 456.831, "coord_origin": "TOPLEFT"}, "confidence": 0.9724196195602417, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "formula", "bbox": {"l": 125.715, "t": 493.391, "r": 128.688, "b": 502.097, "coord_origin": "TOPLEFT"}, "confidence": 0.9423348307609558, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 531.578, "r": 74.451, "b": 540.13, "coord_origin": "TOPLEFT"}, "confidence": 0.9363929629325867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 555.917, "r": 171.983, "b": 566.665, "coord_origin": "TOPLEFT"}, "confidence": 0.9554555416107178, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 576.264, "r": 179.175, "b": 586.116, "coord_origin": "TOPLEFT"}, "confidence": 0.9538503289222717, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "section_header", "bbox": {"l": 308.862, "t": 579.554, "r": 397.443, "b": 589.406, "coord_origin": "TOPLEFT"}, "confidence": 0.9450808763504028, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 62.067, "t": 596.0029999999999, "r": 202.978, "b": 604.5550000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9856163263320923, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 603.718, "r": 545.115, "b": 612.27, "coord_origin": "TOPLEFT"}, "confidence": 0.9880595803260803, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "formula", "bbox": {"l": 91.661, "t": 654.814, "r": 186.017, "b": 663.366, "coord_origin": "TOPLEFT"}, "confidence": 0.844183623790741, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "text", "bbox": {"l": 320.817, "t": 680.604, "r": 545.115, "b": 689.156, "coord_origin": "TOPLEFT"}, "confidence": 0.9830910563468933, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.9724979996681213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8820409178733826, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 5, "page_no": 5, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9868090152740479, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tention encoding is then multiplied to the encoded image to"}, {"label": "text", "id": 9, "page_no": 5, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9799237847328186, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "runtime performance and lower memory footprint of Table-"}, {"label": "text", "id": 1, "page_no": 5, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 116.49800000000005, "r": 545.115, "b": 125.04999999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9880930781364441, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Transformer Encoder consists of two 'Transformer"}, {"label": "text", "id": 6, "page_no": 5, "cluster": {"id": 6, "label": "text", "bbox": {"l": 62.067, "t": 159.89300000000003, "r": 108.154, "b": 168.44500000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9860327839851379, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The output"}, {"label": "text", "id": 4, "page_no": 5, "cluster": {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 243.92200000000003, "r": 129.215, "b": 252.87800000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9873637557029724, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Loss Functions."}, {"label": "text", "id": 3, "page_no": 5, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 336.846, "r": 545.115, "b": 345.398, "coord_origin": "TOPLEFT"}, "confidence": 0.9877589344978333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "For training, TableFormer is trained with 3 Adam opti-"}, {"label": "text", "id": 0, "page_no": 5, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 437.643, "r": 545.115, "b": 446.195, "coord_origin": "TOPLEFT"}, "confidence": 0.9884491562843323, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is implemented with PyTorch and Torchvi-"}, {"label": "text", "id": 11, "page_no": 5, "cluster": {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 448.279, "r": 286.365, "b": 456.831, "coord_origin": "TOPLEFT"}, "confidence": 0.9724196195602417, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The loss used to train the TableFormer can be defined as"}, {"label": "formula", "id": 15, "page_no": 5, "cluster": {"id": 15, "label": "formula", "bbox": {"l": 125.715, "t": 493.391, "r": 128.688, "b": 502.097, "coord_origin": "TOPLEFT"}, "confidence": 0.9423348307609558, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "l"}, {"label": "text", "id": 16, "page_no": 5, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 531.578, "r": 74.451, "b": 540.13, "coord_origin": "TOPLEFT"}, "confidence": 0.9363929629325867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where"}, {"label": "section_header", "id": 12, "page_no": 5, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 555.917, "r": 171.983, "b": 566.665, "coord_origin": "TOPLEFT"}, "confidence": 0.9554555416107178, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Experimental Results"}, {"label": "section_header", "id": 13, "page_no": 5, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 576.264, "r": 179.175, "b": 586.116, "coord_origin": "TOPLEFT"}, "confidence": 0.9538503289222717, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1. Implementation Details"}, {"label": "section_header", "id": 14, "page_no": 5, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 308.862, "t": 579.554, "r": 397.443, "b": 589.406, "coord_origin": "TOPLEFT"}, "confidence": 0.9450808763504028, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2. Generalization"}, {"label": "text", "id": 7, "page_no": 5, "cluster": {"id": 7, "label": "text", "bbox": {"l": 62.067, "t": 596.0029999999999, "r": 202.978, "b": 604.5550000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9856163263320923, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer uses ResNet-18 as the"}, {"label": "text", "id": 2, "page_no": 5, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 603.718, "r": 545.115, "b": 612.27, "coord_origin": "TOPLEFT"}, "confidence": 0.9880595803260803, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is evaluated on three major publicly avail-"}, {"label": "formula", "id": 18, "page_no": 5, "cluster": {"id": 18, "label": "formula", "bbox": {"l": 91.661, "t": 654.814, "r": 186.017, "b": 663.366, "coord_origin": "TOPLEFT"}, "confidence": 0.844183623790741, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image width and height"}, {"label": "text", "id": 8, "page_no": 5, "cluster": {"id": 8, "label": "text", "bbox": {"l": 320.817, "t": 680.604, "r": 545.115, "b": 689.156, "coord_origin": "TOPLEFT"}, "confidence": 0.9830910563468933, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We also share our baseline results on the challenging"}, {"label": "text", "id": 10, "page_no": 5, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.9724979996681213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although input constraints are used also by other methods,"}, {"label": "page_footer", "id": 17, "page_no": 5, "cluster": {"id": 17, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8820409178733826, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6"}], "body": [{"label": "text", "id": 5, "page_no": 5, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9868090152740479, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tention encoding is then multiplied to the encoded image to"}, {"label": "text", "id": 9, "page_no": 5, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9799237847328186, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "runtime performance and lower memory footprint of Table-"}, {"label": "text", "id": 1, "page_no": 5, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 116.49800000000005, "r": 545.115, "b": 125.04999999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9880930781364441, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Transformer Encoder consists of two 'Transformer"}, {"label": "text", "id": 6, "page_no": 5, "cluster": {"id": 6, "label": "text", "bbox": {"l": 62.067, "t": 159.89300000000003, "r": 108.154, "b": 168.44500000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9860327839851379, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The output"}, {"label": "text", "id": 4, "page_no": 5, "cluster": {"id": 4, "label": "text", "bbox": {"l": 62.067, "t": 243.92200000000003, "r": 129.215, "b": 252.87800000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9873637557029724, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Loss Functions."}, {"label": "text", "id": 3, "page_no": 5, "cluster": {"id": 3, "label": "text", "bbox": {"l": 320.817, "t": 336.846, "r": 545.115, "b": 345.398, "coord_origin": "TOPLEFT"}, "confidence": 0.9877589344978333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "For training, TableFormer is trained with 3 Adam opti-"}, {"label": "text", "id": 0, "page_no": 5, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 437.643, "r": 545.115, "b": 446.195, "coord_origin": "TOPLEFT"}, "confidence": 0.9884491562843323, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is implemented with PyTorch and Torchvi-"}, {"label": "text", "id": 11, "page_no": 5, "cluster": {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 448.279, "r": 286.365, "b": 456.831, "coord_origin": "TOPLEFT"}, "confidence": 0.9724196195602417, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The loss used to train the TableFormer can be defined as"}, {"label": "formula", "id": 15, "page_no": 5, "cluster": {"id": 15, "label": "formula", "bbox": {"l": 125.715, "t": 493.391, "r": 128.688, "b": 502.097, "coord_origin": "TOPLEFT"}, "confidence": 0.9423348307609558, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "l"}, {"label": "text", "id": 16, "page_no": 5, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 531.578, "r": 74.451, "b": 540.13, "coord_origin": "TOPLEFT"}, "confidence": 0.9363929629325867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where"}, {"label": "section_header", "id": 12, "page_no": 5, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 555.917, "r": 171.983, "b": 566.665, "coord_origin": "TOPLEFT"}, "confidence": 0.9554555416107178, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Experimental Results"}, {"label": "section_header", "id": 13, "page_no": 5, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 576.264, "r": 179.175, "b": 586.116, "coord_origin": "TOPLEFT"}, "confidence": 0.9538503289222717, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1. Implementation Details"}, {"label": "section_header", "id": 14, "page_no": 5, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 308.862, "t": 579.554, "r": 397.443, "b": 589.406, "coord_origin": "TOPLEFT"}, "confidence": 0.9450808763504028, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2. Generalization"}, {"label": "text", "id": 7, "page_no": 5, "cluster": {"id": 7, "label": "text", "bbox": {"l": 62.067, "t": 596.0029999999999, "r": 202.978, "b": 604.5550000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9856163263320923, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer uses ResNet-18 as the"}, {"label": "text", "id": 2, "page_no": 5, "cluster": {"id": 2, "label": "text", "bbox": {"l": 320.817, "t": 603.718, "r": 545.115, "b": 612.27, "coord_origin": "TOPLEFT"}, "confidence": 0.9880595803260803, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is evaluated on three major publicly avail-"}, {"label": "formula", "id": 18, "page_no": 5, "cluster": {"id": 18, "label": "formula", "bbox": {"l": 91.661, "t": 654.814, "r": 186.017, "b": 663.366, "coord_origin": "TOPLEFT"}, "confidence": 0.844183623790741, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image width and height"}, {"label": "text", "id": 8, "page_no": 5, "cluster": {"id": 8, "label": "text", "bbox": {"l": 320.817, "t": 680.604, "r": 545.115, "b": 689.156, "coord_origin": "TOPLEFT"}, "confidence": 0.9830910563468933, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We also share our baseline results on the challenging"}, {"label": "text", "id": 10, "page_no": 5, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.9724979996681213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although input constraints are used also by other methods,"}], "headers": [{"label": "page_footer", "id": 17, "page_no": 5, "cluster": {"id": 17, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8820409178733826, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6"}]}}, {"page_no": 6, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 114.12599999999998, "r_x1": 286.365, "r_y1": 114.12599999999998, "r_x2": 286.365, "r_y2": 105.57399999999996, "r_x3": 50.112, "r_y3": 105.57399999999996, "coord_origin": "TOPLEFT"}, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 126.08100000000002, "r_x1": 239.999, "r_y1": 126.08100000000002, "r_x2": 239.999, "r_y2": 117.529, "r_x3": 50.112, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "ground-truth as a tree structure of HTML tags.", "orig": "ground-truth as a tree structure of HTML tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.03, "r_y0": 126.08100000000002, "r_x1": 286.365, "r_y1": 126.08100000000002, "r_x2": 286.365, "r_y2": 117.529, "r_x3": 245.03, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "This simi-", "orig": "This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 138.03700000000003, "r_x1": 136.717, "r_y1": 138.03700000000003, "r_x2": 136.717, "r_y2": 129.485, "r_x3": 50.112, "r_y3": 129.485, "coord_origin": "TOPLEFT"}, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.875, "r_y0": 165.87400000000002, "r_x1": 139.77, "r_y1": 165.87400000000002, "r_x2": 139.77, "r_y2": 157.168, "r_x3": 118.875, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.697, "r_y0": 166.798, "r_x1": 129.019, "r_y1": 166.798, "r_x2": 129.019, "r_y2": 160.70399999999995, "r_x3": 124.697, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.766, "r_y0": 166.798, "r_x1": 143.27, "r_y1": 166.798, "r_x2": 143.27, "r_y2": 160.70399999999995, "r_x3": 139.766, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.768, "r_y0": 165.87400000000002, "r_x1": 165.902, "r_y1": 165.87400000000002, "r_x2": 165.902, "r_y2": 157.168, "r_x3": 143.768, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.121, "r_y0": 165.73199999999997, "r_x1": 175.87, "r_y1": 165.73199999999997, "r_x2": 175.87, "r_y2": 157.168, "r_x3": 168.121, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.279, "r_y0": 159.13400000000001, "r_x1": 221.957, "r_y1": 159.13400000000001, "r_x2": 221.957, "r_y2": 150.428, "r_x3": 179.279, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.952, "r_y0": 159.13400000000001, "r_x1": 242.848, "r_y1": 159.13400000000001, "r_x2": 242.848, "r_y2": 150.428, "r_x3": 221.952, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.774, "r_y0": 160.058, "r_x1": 232.096, "r_y1": 160.058, "r_x2": 232.096, "r_y2": 153.96400000000006, "r_x3": 227.774, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.843, "r_y0": 160.058, "r_x1": 246.347, "r_y1": 160.058, "r_x2": 246.347, "r_y2": 153.96400000000006, "r_x3": 242.843, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.845, "r_y0": 159.13400000000001, "r_x1": 250.719, "r_y1": 159.13400000000001, "r_x2": 250.719, "r_y2": 150.428, "r_x3": 246.845, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.212, "r_y0": 172.70799999999997, "r_x1": 206.292, "r_y1": 172.70799999999997, "r_x2": 206.292, "r_y2": 164.00199999999995, "r_x3": 182.212, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "max(", "orig": "max(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.289, "r_y0": 172.56600000000003, "r_x1": 209.057, "r_y1": 172.56600000000003, "r_x2": 209.057, "r_y2": 164.00199999999995, "r_x3": 206.289, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.056, "r_y0": 172.70799999999997, "r_x1": 214.878, "r_y1": 172.70799999999997, "r_x2": 214.878, "r_y2": 164.00199999999995, "r_x3": 209.056, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.878, "r_y0": 173.63199999999995, "r_x1": 219.2, "r_y1": 173.63199999999995, "r_x2": 219.2, "r_y2": 167.538, "r_x3": 214.878, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.697, "r_y0": 172.56600000000003, "r_x1": 222.465, "r_y1": 172.56600000000003, "r_x2": 222.465, "r_y2": 164.00199999999995, "r_x3": 219.697, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.125, "r_y0": 172.70799999999997, "r_x1": 226.893, "r_y1": 172.70799999999997, "r_x2": 226.893, "r_y2": 164.00199999999995, "r_x3": 224.125, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.553, "r_y0": 172.56600000000003, "r_x1": 231.321, "r_y1": 172.56600000000003, "r_x2": 231.321, "r_y2": 164.00199999999995, "r_x3": 228.553, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.32, "r_y0": 172.70799999999997, "r_x1": 237.142, "r_y1": 172.70799999999997, "r_x2": 237.142, "r_y2": 164.00199999999995, "r_x3": 231.32, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.142, "r_y0": 173.63199999999995, "r_x1": 240.646, "r_y1": 173.63199999999995, "r_x2": 240.646, "r_y2": 167.538, "r_x3": 237.142, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.144, "r_y0": 172.56600000000003, "r_x1": 243.912, "r_y1": 172.56600000000003, "r_x2": 243.912, "r_y2": 164.00199999999995, "r_x3": 241.144, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.911, "r_y0": 172.70799999999997, "r_x1": 247.785, "r_y1": 172.70799999999997, "r_x2": 247.785, "r_y2": 164.00199999999995, "r_x3": 243.911, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 166.038, "r_x1": 286.362, "r_y1": 166.038, "r_x2": 286.362, "r_y2": 157.486, "r_x3": 274.746, "r_y3": 157.486, "coord_origin": "TOPLEFT"}, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.581, "r_y0": 189.81899999999996, "r_x1": 94.403, "r_y1": 189.81899999999996, "r_x2": 94.403, "r_y2": 181.11300000000006, "r_x3": 88.581, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.403, "r_y0": 190.74199999999996, "r_x1": 98.725, "r_y1": 190.74199999999996, "r_x2": 98.725, "r_y2": 184.64800000000002, "r_x3": 94.403, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.399, "r_y0": 189.98299999999995, "r_x1": 115.785, "r_y1": 189.98299999999995, "r_x2": 115.785, "r_y2": 181.43100000000004, "r_x3": 101.399, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.961, "r_y0": 189.81899999999996, "r_x1": 123.783, "r_y1": 189.81899999999996, "r_x2": 123.783, "r_y2": 181.11300000000006, "r_x3": 117.961, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.783, "r_y0": 190.74199999999996, "r_x1": 127.287, "r_y1": 190.74199999999996, "r_x2": 127.287, "r_y2": 184.64800000000002, "r_x3": 123.783, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.96, "r_y0": 189.98299999999995, "r_x1": 286.363, "r_y1": 189.98299999999995, "r_x2": 286.363, "r_y2": 181.43100000000004, "r_x3": 129.96, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 201.938, "r_x1": 252.781, "r_y1": 201.938, "r_x2": 252.781, "r_y2": 193.38599999999997, "r_x3": 50.112, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.182, "r_y0": 201.63199999999995, "r_x1": 257.95, "r_y1": 201.63199999999995, "r_x2": 257.95, "r_y2": 193.06799999999998, "r_x3": 255.182, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.949, "r_y0": 201.774, "r_x1": 263.771, "r_y1": 201.774, "r_x2": 263.771, "r_y2": 193.06799999999998, "r_x3": 257.949, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.155, "r_y0": 201.63199999999995, "r_x1": 267.923, "r_y1": 201.63199999999995, "r_x2": 267.923, "r_y2": 193.06799999999998, "r_x3": 265.155, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.322, "r_y0": 201.938, "r_x1": 286.362, "r_y1": 201.938, "r_x2": 286.362, "r_y2": 193.38599999999997, "r_x3": 270.322, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 213.89300000000003, "r_x1": 172.134, "r_y1": 213.89300000000003, "r_x2": 172.134, "r_y2": 205.341, "r_x3": 50.112, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.624, "r_y0": 213.72900000000004, "r_x1": 180.446, "r_y1": 213.72900000000004, "r_x2": 180.446, "r_y2": 205.02300000000002, "r_x3": 174.624, "r_y3": 205.02300000000002, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.829, "r_y0": 213.89300000000003, "r_x1": 184.32, "r_y1": 213.89300000000003, "r_x2": 184.32, "r_y2": 205.341, "r_x3": 181.829, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.126, "r_y0": 252.59000000000003, "r_x1": 184.684, "r_y1": 252.59000000000003, "r_x2": 184.684, "r_y2": 244.038, "r_x3": 112.126, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.478, "r_y0": 252.59000000000003, "r_x1": 198.95, "r_y1": 252.59000000000003, "r_x2": 198.95, "r_y2": 244.038, "r_x3": 191.478, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.995, "r_y0": 252.59000000000003, "r_x1": 286.362, "r_y1": 252.59000000000003, "r_x2": 286.362, "r_y2": 244.038, "r_x3": 202.995, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "TableFormer outper-", "orig": "TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.54499999999996, "r_x1": 286.365, "r_y1": 264.54499999999996, "r_x2": 286.365, "r_y2": 255.99300000000005, "r_x3": 50.112, "r_y3": 255.99300000000005, "coord_origin": "TOPLEFT"}, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.5, "r_x1": 138.719, "r_y1": 276.5, "r_x2": 138.719, "r_y2": 267.948, "r_x3": 50.112, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "margin for predicting", "orig": "margin for predicting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.993, "r_y0": 276.5, "r_x1": 155.168, "r_y1": 276.5, "r_x2": 155.168, "r_y2": 267.948, "r_x3": 142.993, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.432, "r_y0": 276.5, "r_x1": 178.799, "r_y1": 276.5, "r_x2": 178.799, "r_y2": 267.948, "r_x3": 159.432, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.073, "r_y0": 276.5, "r_x1": 217.932, "r_y1": 276.5, "r_x2": 217.932, "r_y2": 267.948, "r_x3": 183.073, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.206, "r_y0": 276.5, "r_x1": 286.365, "r_y1": 276.5, "r_x2": 286.365, "r_y2": 267.948, "r_x3": 222.206, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "from an image.", "orig": "from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.455, "r_x1": 286.365, "r_y1": 288.455, "r_x2": 286.365, "r_y2": 279.903, "r_x3": 50.112, "r_y3": 279.903, "coord_origin": "TOPLEFT"}, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.411, "r_x1": 286.365, "r_y1": 300.411, "r_x2": 286.365, "r_y2": 291.859, "r_x3": 50.112, "r_y3": 291.859, "coord_origin": "TOPLEFT"}, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.366, "r_x1": 286.365, "r_y1": 312.366, "r_x2": 286.365, "r_y2": 303.814, "r_x3": 50.112, "r_y3": 303.814, "coord_origin": "TOPLEFT"}, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.321, "r_x1": 80.269, "r_y1": 324.321, "r_x2": 80.269, "r_y2": 315.769, "r_x3": 50.112, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.579, "r_y0": 324.321, "r_x1": 91.666, "r_y1": 324.321, "r_x2": 91.666, "r_y2": 315.769, "r_x3": 85.579, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "It", "orig": "It", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.894, "r_y0": 324.321, "r_x1": 257.812, "r_y1": 324.321, "r_x2": 257.812, "r_y2": 315.769, "r_x3": 94.894, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "has been observed that large tables (e.g.", "orig": "has been observed that large tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.122, "r_y0": 324.321, "r_x1": 286.365, "r_y1": 324.321, "r_x2": 286.365, "r_y2": 315.769, "r_x3": 263.122, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.276, "r_x1": 286.365, "r_y1": 336.276, "r_x2": 286.365, "r_y2": 327.724, "r_x3": 50.112, "r_y3": 327.724, "coord_origin": "TOPLEFT"}, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.231, "r_x1": 286.365, "r_y1": 348.231, "r_x2": 286.365, "r_y2": 339.679, "r_x3": 50.112, "r_y3": 339.679, "coord_origin": "TOPLEFT"}, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.186, "r_x1": 115.068, "r_y1": 360.186, "r_x2": 115.068, "r_y2": 351.634, "r_x3": 50.112, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "processing step,", "orig": "processing step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.203, "r_y0": 360.186, "r_x1": 134.147, "r_y1": 360.186, "r_x2": 134.147, "r_y2": 351.634, "r_x3": 119.203, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "that", "orig": "that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.952, "r_y0": 360.186, "r_x1": 286.365, "r_y1": 360.186, "r_x2": 286.365, "r_y2": 351.634, "r_x3": 137.952, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "produces downsampled images with", "orig": "produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.142, "r_x1": 155.357, "r_y1": 372.142, "r_x2": 155.357, "r_y2": 363.59, "r_x3": 50.112, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "indistinguishable features.", "orig": "indistinguishable features.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.378, "r_y0": 372.142, "r_x1": 286.365, "r_y1": 372.142, "r_x2": 286.365, "r_y2": 363.59, "r_x3": 160.378, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "This problem can be addressed", "orig": "This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.097, "r_x1": 286.365, "r_y1": 384.097, "r_x2": 286.365, "r_y2": 375.545, "r_x3": 50.112, "r_y3": 375.545, "coord_origin": "TOPLEFT"}, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.052, "r_x1": 170.012, "r_y1": 396.052, "r_x2": 170.012, "r_y2": 387.5, "r_x3": 50.112, "r_y3": 387.5, "coord_origin": "TOPLEFT"}, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.382, "r_y0": 601.254, "r_x1": 286.365, "r_y1": 601.254, "r_x2": 286.365, "r_y2": 592.702, "r_x3": 87.382, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Structure results on PubTabNet (PTN), FinTabNet", "orig": "Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 613.2090000000001, "r_x1": 247.461, "r_y1": 613.2090000000001, "r_x2": 247.461, "r_y2": 604.657, "r_x3": 50.112, "r_y3": 604.657, "coord_origin": "TOPLEFT"}, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.204, "r_y0": 653.29, "r_x1": 242.933, "r_y1": 653.29, "r_x2": 242.933, "r_y2": 644.738, "r_x3": 128.204, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.554, "r_y0": 653.1469999999999, "r_x1": 286.361, "r_y1": 653.1469999999999, "r_x2": 286.361, "r_y2": 644.559, "r_x3": 245.554, "r_y3": 644.559, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.102, "r_x1": 84.971, "r_y1": 665.102, "r_x2": 84.971, "r_y2": 656.514, "r_x3": 50.112, "r_y3": 656.514, "coord_origin": "TOPLEFT"}, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.515, "r_y0": 665.245, "r_x1": 123.677, "r_y1": 665.245, "r_x2": 123.677, "r_y2": 656.693, "r_x3": 89.515, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "provides", "orig": "provides", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.991, "r_y0": 665.245, "r_x1": 286.366, "r_y1": 665.245, "r_x2": 286.366, "r_y2": 656.693, "r_x3": 127.991, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "bounding boxes that can be improved", "orig": "bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.2, "r_x1": 286.365, "r_y1": 677.2, "r_x2": 286.365, "r_y2": 668.648, "r_x3": 50.112, "r_y3": 668.648, "coord_origin": "TOPLEFT"}, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 259.655, "r_y1": 689.156, "r_x2": 259.655, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "grid-like structure of tables to refine the predictions.", "orig": "grid-like structure of tables to refine the predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.65, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 263.65, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "A de-", "orig": "A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 147.068, "r_y1": 713.066, "r_x2": 147.068, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "supplementary material.", "orig": "supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.159, "r_y0": 713.066, "r_x1": 223.003, "r_y1": 713.066, "r_x2": 223.003, "r_y2": 704.514, "r_x3": 152.159, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.094, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 228.094, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "3, we evaluate", "orig": "3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 325.454, "r_y0": 83.88599999999997, "r_x1": 404.567, "r_y1": 83.88599999999997, "r_x2": 404.567, "r_y2": 75.298, "r_x3": 325.454, "r_y3": 75.298, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.104, "r_y0": 84.029, "r_x1": 545.11, "r_y1": 84.029, "r_x2": 545.11, "r_y2": 75.47699999999998, "r_x3": 408.104, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "bel of 'content' only using the PASCAL VOC mAP metric", "orig": "bel of 'content' only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 320.478, "r_y1": 107.93899999999996, "r_x2": 320.478, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.374, "r_y0": 107.93899999999996, "r_x1": 470.226, "r_y1": 107.93899999999996, "r_x2": 470.226, "r_y2": 99.38699999999994, "r_x3": 324.374, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "pre-processing and post-processing.", "orig": "pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.529, "r_y0": 107.93899999999996, "r_x1": 545.115, "r_y1": 107.93899999999996, "r_x2": 545.115, "r_y2": 99.38699999999994, "r_x3": 477.529, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 119.894, "r_x1": 545.115, "r_y1": 119.894, "r_x2": 545.115, "r_y2": 111.34199999999998, "r_x3": 308.862, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 131.84900000000005, "r_x1": 545.115, "r_y1": 131.84900000000005, "r_x2": 545.115, "r_y2": 123.29700000000003, "r_x3": 308.862, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 143.80499999999995, "r_x1": 502.017, "r_y1": 143.80499999999995, "r_x2": 502.017, "r_y2": 135.25300000000004, "r_x3": 308.862, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "posed approach, we've integrated TableFormer's", "orig": "posed approach, we've integrated TableFormer's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.473, "r_y0": 143.66200000000003, "r_x1": 545.11, "r_y1": 143.66200000000003, "r_x2": 545.11, "r_y2": 135.07399999999996, "r_x3": 504.473, "r_y3": 135.07399999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 155.61699999999996, "r_x1": 343.163, "r_y1": 155.61699999999996, "r_x2": 343.163, "r_y2": 147.029, "r_x3": 308.862, "r_y3": 147.029, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 155.76, "r_x1": 437.818, "r_y1": 155.76, "r_x2": 437.818, "r_y2": 147.20799999999997, "r_x3": 346.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "into EDD architecture.", "orig": "into EDD architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.371, "r_y0": 155.76, "r_x1": 545.115, "r_y1": 155.76, "r_x2": 545.115, "r_y2": 147.20799999999997, "r_x3": 442.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "As mentioned previously,", "orig": "As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 167.71500000000003, "r_x1": 446.157, "r_y1": 167.71500000000003, "r_x2": 446.157, "r_y2": 159.163, "r_x3": 308.862, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.29, "r_y0": 167.572, "r_x1": 525.042, "r_y1": 167.572, "r_x2": 525.042, "r_y2": 158.98400000000004, "r_x3": 448.29, "r_y3": 158.98400000000004, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.399, "r_y0": 167.71500000000003, "r_x1": 545.113, "r_y1": 167.71500000000003, "r_x2": 545.113, "r_y2": 159.163, "r_x3": 527.399, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 179.66999999999996, "r_x1": 545.115, "r_y1": 179.66999999999996, "r_x2": 545.115, "r_y2": 171.11800000000005, "r_x3": 308.862, "r_y3": 171.11800000000005, "coord_origin": "TOPLEFT"}, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 191.625, "r_x1": 432.866, "r_y1": 191.625, "r_x2": 432.866, "r_y2": 183.07299999999998, "r_x3": 308.862, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.39, "r_y0": 191.48199999999997, "r_x1": 510.93, "r_y1": 191.48199999999997, "r_x2": 510.93, "r_y2": 182.894, "r_x3": 436.39, "r_y3": 182.894, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.677, "r_y0": 191.625, "r_x1": 545.113, "r_y1": 191.625, "r_x2": 545.113, "r_y2": 183.07299999999998, "r_x3": 514.677, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 203.58000000000004, "r_x1": 431.173, "r_y1": 203.58000000000004, "r_x2": 431.173, "r_y2": 195.02800000000002, "r_x3": 308.862, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.679, "r_y0": 203.437, "r_x1": 514.181, "r_y1": 203.437, "r_x2": 514.181, "r_y2": 194.84900000000005, "r_x3": 434.679, "r_y3": 194.84900000000005, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.176, "r_y0": 203.58000000000004, "r_x1": 516.667, "r_y1": 203.58000000000004, "r_x2": 516.667, "r_y2": 195.02800000000002, "r_x3": 514.176, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.794, "r_y0": 203.58000000000004, "r_x1": 529.429, "r_y1": 203.58000000000004, "r_x2": 529.429, "r_y2": 195.02800000000002, "r_x3": 522.794, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "If", "orig": "If", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.936, "r_y0": 203.58000000000004, "r_x1": 545.11, "r_y1": 203.58000000000004, "r_x2": 545.11, "r_y2": 195.02800000000002, "r_x3": 532.936, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 215.39300000000003, "r_x1": 382.356, "r_y1": 215.39300000000003, "r_x2": 382.356, "r_y2": 206.80499999999995, "r_x3": 308.862, "r_y3": 206.80499999999995, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.075, "r_y0": 215.53599999999994, "r_x1": 545.114, "r_y1": 215.53599999999994, "r_x2": 545.114, "r_y2": 206.98400000000004, "r_x3": 385.075, "r_y3": 206.98400000000004, "coord_origin": "TOPLEFT"}, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 227.49099999999999, "r_x1": 501.698, "r_y1": 227.49099999999999, "r_x2": 501.698, "r_y2": 218.93899999999996, "r_x3": 308.862, "r_y3": 218.93899999999996, "coord_origin": "TOPLEFT"}, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.603, "r_y0": 325.27, "r_x1": 545.115, "r_y1": 325.27, "r_x2": 545.115, "r_y2": 316.718, "r_x3": 348.603, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.225, "r_x1": 474.978, "r_y1": 337.225, "r_x2": 474.978, "r_y2": 328.673, "r_x3": 308.862, "r_y3": 328.673, "coord_origin": "TOPLEFT"}, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 387.079, "r_y0": 376.62, "r_x1": 395.378, "r_y1": 376.62, "r_x2": 395.378, "r_y2": 368.068, "r_x3": 387.079, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.552, "r_y0": 376.62, "r_x1": 413.948, "r_y1": 376.62, "r_x2": 413.948, "r_y2": 368.068, "r_x3": 399.552, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.112, "r_y0": 376.62, "r_x1": 448.827, "r_y1": 376.62, "r_x2": 448.827, "r_y2": 368.068, "r_x3": 418.112, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "section,", "orig": "section,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.42, "r_y0": 376.62, "r_x1": 545.116, "r_y1": 376.62, "r_x2": 545.116, "r_y2": 368.068, "r_x3": 453.42, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "we evaluate the entire", "orig": "we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.575, "r_x1": 487.193, "r_y1": 388.575, "r_x2": 487.193, "r_y2": 380.023, "r_x3": 308.862, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.967, "r_y0": 388.575, "r_x1": 545.115, "r_y1": 388.575, "r_x2": 545.115, "r_y2": 380.023, "r_x3": 493.967, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.53, "r_x1": 545.115, "r_y1": 400.53, "r_x2": 545.115, "r_y2": 391.978, "r_x3": 308.862, "r_y3": 391.978, "coord_origin": "TOPLEFT"}, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.486, "r_x1": 545.115, "r_y1": 412.486, "r_x2": 545.115, "r_y2": 403.934, "r_x3": 308.862, "r_y3": 403.934, "coord_origin": "TOPLEFT"}, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.441, "r_x1": 545.115, "r_y1": 424.441, "r_x2": 545.115, "r_y2": 415.889, "r_x3": 308.862, "r_y3": 415.889, "coord_origin": "TOPLEFT"}, "text": "4 shows the TEDs score of HTML code representing the", "orig": "4 shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.396, "r_x1": 545.115, "r_y1": 436.396, "r_x2": 545.115, "r_y2": 427.844, "r_x3": 308.862, "r_y3": 427.844, "coord_origin": "TOPLEFT"}, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.351, "r_x1": 545.115, "r_y1": 448.351, "r_x2": 545.115, "r_y2": 439.799, "r_x3": 308.862, "r_y3": 439.799, "coord_origin": "TOPLEFT"}, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 460.306, "r_x1": 350.237, "r_y1": 460.306, "r_x2": 350.237, "r_y2": 451.754, "r_x3": 308.862, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.176, "r_y0": 460.322, "r_x1": 374.592, "r_y1": 460.322, "r_x2": 374.592, "r_y2": 451.366, "r_x3": 352.176, "r_y3": 451.366, "coord_origin": "TOPLEFT"}, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.533, "r_y0": 460.306, "r_x1": 545.11, "r_y1": 460.306, "r_x2": 545.11, "r_y2": 451.754, "r_x3": 376.533, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 472.261, "r_x1": 380.523, "r_y1": 472.261, "r_x2": 380.523, "r_y2": 463.709, "r_x3": 308.862, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "mercial solutions.", "orig": "mercial solutions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.042, "r_y0": 472.261, "r_x1": 545.115, "r_y1": 472.261, "r_x2": 545.115, "r_y2": 463.709, "r_x3": 386.042, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "We believe our scores would be higher", "orig": "We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.217, "r_x1": 314.949, "r_y1": 484.217, "r_x2": 314.949, "r_y2": 475.665, "r_x3": 308.862, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.008, "r_y0": 484.217, "r_x1": 545.115, "r_y1": 484.217, "r_x2": 545.115, "r_y2": 475.665, "r_x3": 318.008, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "the HTML ground-truth matched the extracted PDF cell", "orig": "the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.172, "r_x1": 340.683, "r_y1": 496.172, "r_x2": 340.683, "r_y2": 487.62, "r_x3": 308.862, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "content.", "orig": "content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.793, "r_y0": 496.172, "r_x1": 545.115, "r_y1": 496.172, "r_x2": 545.115, "r_y2": 487.62, "r_x3": 345.793, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, there are small discrepancies such", "orig": "Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.127, "r_x1": 545.115, "r_y1": 508.127, "r_x2": 545.115, "r_y2": 499.575, "r_x3": 308.862, "r_y3": 499.575, "coord_origin": "TOPLEFT"}, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.082, "r_x1": 405.698, "r_y1": 520.082, "r_x2": 405.698, "r_y2": 511.53, "r_x3": 308.862, "r_y3": 511.53, "coord_origin": "TOPLEFT"}, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 349.559, "r_y0": 665.682, "r_x1": 545.115, "r_y1": 665.682, "r_x2": 545.115, "r_y2": 657.13, "r_x3": 349.559, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.637, "r_x1": 425.763, "r_y1": 677.637, "r_x2": 425.763, "r_y2": 669.085, "r_x3": 308.862, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "cell detection on PubTabNet.", "orig": "cell detection on PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.336, "r_y0": 677.637, "r_x1": 545.115, "r_y1": 677.637, "r_x2": 545.115, "r_y2": 669.085, "r_x3": 430.336, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "In all cases the input is PDF", "orig": "In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.592, "r_x1": 435.038, "r_y1": 689.592, "r_x2": 435.038, "r_y2": 681.04, "r_x3": 308.862, "r_y3": 681.04, "coord_origin": "TOPLEFT"}, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 10, "label": "section_header", "bbox": {"l": 50.112, "t": 74.40099999999995, "r": 167.898, "b": 84.25300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9554274082183838, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 322.142, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9713197946548462, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 93.61900000000003, "r": 286.365, "b": 102.17100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9862998127937317, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "formula", "bbox": {"l": 86.219, "t": 157.168, "r": 118.878, "b": 165.87400000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9500409364700317, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "text", "bbox": {"l": 62.067, "t": 181.43100000000004, "r": 86.406, "b": 189.98299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9735319018363953, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "section_header", "bbox": {"l": 50.112, "t": 224.81899999999996, "r": 170.452, "b": 234.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9588837027549744, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 243.64999999999998, "r": 105.325, "b": 252.606, "coord_origin": "TOPLEFT"}, "confidence": 0.9855090975761414, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "caption", "bbox": {"l": 308.862, "t": 316.718, "r": 341.499, "b": 325.27, "coord_origin": "TOPLEFT"}, "confidence": 0.9519917964935303, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 320.817, "t": 367.68, "r": 378.949, "b": 376.636, "coord_origin": "TOPLEFT"}, "confidence": 0.9835010766983032, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 50.112, "t": 592.702, "r": 82.062, "b": 601.254, "coord_origin": "TOPLEFT"}, "confidence": 0.7209173440933228, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 616.612, "r": 261.787, "b": 625.164, "coord_origin": "TOPLEFT"}, "confidence": 0.6433312892913818, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 644.35, "r": 124.722, "b": 653.306, "coord_origin": "TOPLEFT"}, "confidence": 0.9854635000228882, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 657.13, "r": 341.739, "b": 665.682, "coord_origin": "TOPLEFT"}, "confidence": 0.9541404247283936, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8787972331047058, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [], "children": []}, {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [], "children": []}, {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"8": {"label": "table", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "0": {"label": "table", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "5": {"label": "table", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "section_header", "id": 10, "page_no": 6, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 50.112, "t": 74.40099999999995, "r": 167.898, "b": 84.25300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9554274082183838, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.3. Datasets and Metrics"}, {"label": "text", "id": 7, "page_no": 6, "cluster": {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 322.142, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9713197946548462, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "our"}, {"label": "text", "id": 1, "page_no": 6, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 93.61900000000003, "r": 286.365, "b": 102.17100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9862998127937317, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-"}, {"label": "formula", "id": 13, "page_no": 6, "cluster": {"id": 13, "label": "formula", "bbox": {"l": 86.219, "t": 157.168, "r": 118.878, "b": 165.87400000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9500409364700317, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TEDS("}, {"label": "text", "id": 6, "page_no": 6, "cluster": {"id": 6, "label": "text", "bbox": {"l": 62.067, "t": 181.43100000000004, "r": 86.406, "b": 189.98299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9735319018363953, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where"}, {"label": "section_header", "id": 9, "page_no": 6, "cluster": {"id": 9, "label": "section_header", "bbox": {"l": 50.112, "t": 224.81899999999996, "r": 170.452, "b": 234.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9588837027549744, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.4. Quantitative Analysis"}, {"label": "text", "id": 2, "page_no": 6, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 243.64999999999998, "r": 105.325, "b": 252.606, "coord_origin": "TOPLEFT"}, "confidence": 0.9855090975761414, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure."}, {"label": "caption", "id": 12, "page_no": 6, "cluster": {"id": 12, "label": "caption", "bbox": {"l": 308.862, "t": 316.718, "r": 341.499, "b": 325.27, "coord_origin": "TOPLEFT"}, "confidence": 0.9519917964935303, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 3:"}, {"label": "text", "id": 4, "page_no": 6, "cluster": {"id": 4, "label": "text", "bbox": {"l": 320.817, "t": 367.68, "r": 378.949, "b": 376.636, "coord_origin": "TOPLEFT"}, "confidence": 0.9835010766983032, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Content."}, {"label": "text", "id": 15, "page_no": 6, "cluster": {"id": 15, "label": "text", "bbox": {"l": 50.112, "t": 592.702, "r": 82.062, "b": 601.254, "coord_origin": "TOPLEFT"}, "confidence": 0.7209173440933228, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 2:"}, {"label": "text", "id": 16, "page_no": 6, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 616.612, "r": 261.787, "b": 625.164, "coord_origin": "TOPLEFT"}, "confidence": 0.6433312892913818, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "FT: Model was trained on PubTabNet then finetuned."}, {"label": "text", "id": 3, "page_no": 6, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 644.35, "r": 124.722, "b": 653.306, "coord_origin": "TOPLEFT"}, "confidence": 0.9854635000228882, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Detection."}, {"label": "caption", "id": 11, "page_no": 6, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 657.13, "r": 341.739, "b": 665.682, "coord_origin": "TOPLEFT"}, "confidence": 0.9541404247283936, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 4:"}, {"label": "page_footer", "id": 14, "page_no": 6, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8787972331047058, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7"}, {"label": "table", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "section_header", "id": 10, "page_no": 6, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 50.112, "t": 74.40099999999995, "r": 167.898, "b": 84.25300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9554274082183838, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.3. Datasets and Metrics"}, {"label": "text", "id": 7, "page_no": 6, "cluster": {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 322.142, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.9713197946548462, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "our"}, {"label": "text", "id": 1, "page_no": 6, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 93.61900000000003, "r": 286.365, "b": 102.17100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9862998127937317, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-"}, {"label": "formula", "id": 13, "page_no": 6, "cluster": {"id": 13, "label": "formula", "bbox": {"l": 86.219, "t": 157.168, "r": 118.878, "b": 165.87400000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9500409364700317, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TEDS("}, {"label": "text", "id": 6, "page_no": 6, "cluster": {"id": 6, "label": "text", "bbox": {"l": 62.067, "t": 181.43100000000004, "r": 86.406, "b": 189.98299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9735319018363953, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where"}, {"label": "section_header", "id": 9, "page_no": 6, "cluster": {"id": 9, "label": "section_header", "bbox": {"l": 50.112, "t": 224.81899999999996, "r": 170.452, "b": 234.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9588837027549744, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.4. Quantitative Analysis"}, {"label": "text", "id": 2, "page_no": 6, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 243.64999999999998, "r": 105.325, "b": 252.606, "coord_origin": "TOPLEFT"}, "confidence": 0.9855090975761414, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure."}, {"label": "caption", "id": 12, "page_no": 6, "cluster": {"id": 12, "label": "caption", "bbox": {"l": 308.862, "t": 316.718, "r": 341.499, "b": 325.27, "coord_origin": "TOPLEFT"}, "confidence": 0.9519917964935303, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 3:"}, {"label": "text", "id": 4, "page_no": 6, "cluster": {"id": 4, "label": "text", "bbox": {"l": 320.817, "t": 367.68, "r": 378.949, "b": 376.636, "coord_origin": "TOPLEFT"}, "confidence": 0.9835010766983032, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Content."}, {"label": "text", "id": 15, "page_no": 6, "cluster": {"id": 15, "label": "text", "bbox": {"l": 50.112, "t": 592.702, "r": 82.062, "b": 601.254, "coord_origin": "TOPLEFT"}, "confidence": 0.7209173440933228, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 2:"}, {"label": "text", "id": 16, "page_no": 6, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 616.612, "r": 261.787, "b": 625.164, "coord_origin": "TOPLEFT"}, "confidence": 0.6433312892913818, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "FT: Model was trained on PubTabNet then finetuned."}, {"label": "text", "id": 3, "page_no": 6, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 644.35, "r": 124.722, "b": 653.306, "coord_origin": "TOPLEFT"}, "confidence": 0.9854635000228882, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Detection."}, {"label": "caption", "id": 11, "page_no": 6, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 657.13, "r": 341.739, "b": 665.682, "coord_origin": "TOPLEFT"}, "confidence": 0.9541404247283936, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 4:"}, {"label": "table", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_footer", "id": 14, "page_no": 6, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8787972331047058, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7"}]}}, {"page_no": 7, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.918, "r_y0": 329.698, "r_x1": 545.114, "r_y1": 329.698, "r_x2": 545.114, "r_y2": 321.146, "r_x3": 93.918, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 341.653, "r_x1": 545.114, "r_y1": 341.653, "r_x2": 545.114, "r_y2": 333.101, "r_x3": 50.112, "r_y3": 333.101, "coord_origin": "TOPLEFT"}, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 353.608, "r_x1": 545.114, "r_y1": 353.608, "r_x2": 545.114, "r_y2": 345.056, "r_x3": 50.112, "r_y3": 345.056, "coord_origin": "TOPLEFT"}, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.564, "r_x1": 139.795, "r_y1": 365.564, "r_x2": 139.795, "r_y2": 357.012, "r_x3": 50.112, "r_y3": 357.012, "coord_origin": "TOPLEFT"}, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.428, "r_y0": 467.549, "r_x1": 532.63, "r_y1": 467.549, "r_x2": 532.63, "r_y2": 458.997, "r_x3": 104.428, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.985, "r_y0": 545.694, "r_x1": 151.8, "r_y1": 545.694, "r_x2": 151.8, "r_y2": 537.142, "r_x3": 123.985, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "several", "orig": "several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.28, "r_y0": 545.694, "r_x1": 212.074, "r_y1": 545.694, "r_x2": 212.074, "r_y2": 537.142, "r_x3": 157.28, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "visualizations", "orig": "visualizations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.553, "r_y0": 545.694, "r_x1": 229.17, "r_y1": 545.694, "r_x2": 229.17, "r_y2": 537.142, "r_x3": 217.553, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.659, "r_y0": 545.694, "r_x1": 246.833, "r_y1": 545.694, "r_x2": 246.833, "r_y2": 537.142, "r_x3": 234.659, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.313, "r_y0": 545.694, "r_x1": 286.365, "r_y1": 545.694, "r_x2": 286.365, "r_y2": 537.142, "r_x3": 252.313, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 557.649, "r_x1": 211.157, "r_y1": 557.649, "r_x2": 211.157, "r_y2": 549.097, "r_x3": 50.112, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.1, "r_y0": 557.506, "r_x1": 259.175, "r_y1": 557.506, "r_x2": 259.175, "r_y2": 548.918, "r_x3": 215.1, "r_y3": 548.918, "coord_origin": "TOPLEFT"}, "text": "'complex'", "orig": "'complex'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.12, "r_y0": 557.649, "r_x1": 286.363, "r_y1": 557.649, "r_x2": 286.363, "r_y2": 549.097, "r_x3": 263.12, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 569.604, "r_x1": 231.72, "r_y1": 569.604, "r_x2": 231.72, "r_y2": 561.052, "r_x3": 50.112, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "within datasets presented in this work in Fig.", "orig": "within datasets presented in this work in Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.064, "r_y0": 569.604, "r_x1": 277.03, "r_y1": 569.604, "r_x2": 277.03, "r_y2": 561.052, "r_x3": 236.064, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "5 and Fig.", "orig": "5 and Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.384, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 281.384, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 122.341, "r_y1": 593.514, "r_x2": 122.341, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "for all table cells,", "orig": "for all table cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.107, "r_y0": 593.514, "r_x1": 228.004, "r_y1": 593.514, "r_x2": 228.004, "r_y2": 584.962, "r_x3": 126.107, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "even for the empty ones.", "orig": "even for the empty ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.151, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 234.151, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 230.873, "r_y1": 629.38, "r_x2": 230.873, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "based on their overlap and spatial proximity.", "orig": "based on their overlap and spatial proximity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.855, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 235.855, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "The left part", "orig": "The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 77.121, "r_y1": 641.335, "r_x2": 77.121, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "of Fig.", "orig": "of Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.544, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 81.544, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "5 demonstrates also the adaptability of our method", "orig": "5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 57.863, "r_y1": 653.29, "r_x2": 57.863, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.436, "r_y0": 653.29, "r_x1": 119.691, "r_y1": 653.29, "r_x2": 119.691, "r_y2": 644.738, "r_x3": 62.436, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "any language,", "orig": "any language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.782, "r_y0": 653.29, "r_x1": 133.081, "r_y1": 653.29, "r_x2": 133.081, "r_y2": 644.738, "r_x3": 124.782, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.653, "r_y0": 653.29, "r_x1": 143.193, "r_y1": 653.29, "r_x2": 143.193, "r_y2": 644.738, "r_x3": 137.653, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.765, "r_y0": 653.29, "r_x1": 214.854, "r_y1": 653.29, "r_x2": 214.854, "r_y2": 644.738, "r_x3": 147.765, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "can successfully", "orig": "can successfully", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.426, "r_y0": 653.29, "r_x1": 246.385, "r_y1": 653.29, "r_x2": 246.385, "r_y2": 644.738, "r_x3": 219.426, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "extract", "orig": "extract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.958, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 250.958, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Japanese", "orig": "Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 195.217, "r_y1": 689.156, "r_x2": 195.217, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "steps in the supplementary material.", "orig": "steps in the supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.431, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 199.431, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Overall these illustra-", "orig": "Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 226.888, "r_y1": 713.066, "r_x2": 226.888, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work & Conclusion", "orig": "6. Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.669, "r_x1": 545.115, "r_y1": 533.669, "r_x2": 545.115, "r_y2": 525.117, "r_x3": 308.862, "r_y3": 525.117, "coord_origin": "TOPLEFT"}, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.624, "r_x1": 545.115, "r_y1": 545.624, "r_x2": 545.115, "r_y2": 537.072, "r_x3": 308.862, "r_y3": 537.072, "coord_origin": "TOPLEFT"}, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.579, "r_x1": 545.115, "r_y1": 557.579, "r_x2": 545.115, "r_y2": 549.027, "r_x3": 308.862, "r_y3": 549.027, "coord_origin": "TOPLEFT"}, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.534, "r_x1": 524.562, "r_y1": 569.534, "r_x2": 524.562, "r_y2": 560.982, "r_x3": 308.862, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "content from PDF or OCR by using bounding boxes.", "orig": "content from PDF or OCR by using bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 569.534, "r_x1": 545.115, "r_y1": 569.534, "r_x2": 545.115, "r_y2": 560.982, "r_x3": 529.623, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "Ad-", "orig": "Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.489, "r_x1": 545.115, "r_y1": 581.489, "r_x2": 545.115, "r_y2": 572.937, "r_x3": 308.862, "r_y3": 572.937, "coord_origin": "TOPLEFT"}, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4449999999999, "r_x1": 545.115, "r_y1": 593.4449999999999, "r_x2": 545.115, "r_y2": 584.893, "r_x3": 308.862, "r_y3": 584.893, "coord_origin": "TOPLEFT"}, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.4, "r_x1": 335.153, "r_y1": 605.4, "r_x2": 335.153, "r_y2": 596.848, "r_x3": 308.862, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "ments,", "orig": "ments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.656, "r_y0": 605.4, "r_x1": 400.468, "r_y1": 605.4, "r_x2": 400.468, "r_y2": 596.848, "r_x3": 339.656, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "and languages.", "orig": "and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.378, "r_y0": 605.4, "r_x1": 460.672, "r_y1": 605.4, "r_x2": 460.672, "r_y2": 596.848, "r_x3": 408.378, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.175, "r_y0": 605.4, "r_x1": 545.115, "r_y1": 605.4, "r_x2": 545.115, "r_y2": 596.848, "r_x3": 465.175, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "our method outper-", "orig": "our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.355, "r_x1": 495.471, "r_y1": 617.355, "r_x2": 495.471, "r_y2": 608.803, "r_x3": 308.862, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "forms all state-of-the-arts with a wide margin.", "orig": "forms all state-of-the-arts with a wide margin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.234, "r_y0": 617.355, "r_x1": 545.115, "r_y1": 617.355, "r_x2": 545.115, "r_y2": 608.803, "r_x3": 500.234, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "Finally, we", "orig": "Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.31, "r_x1": 545.115, "r_y1": 629.31, "r_x2": 545.115, "r_y2": 620.758, "r_x3": 308.862, "r_y3": 620.758, "coord_origin": "TOPLEFT"}, "text": "introduce 'SynthTabNet' a challenging synthetically gen-", "orig": "introduce 'SynthTabNet' a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.265, "r_x1": 545.115, "r_y1": 641.265, "r_x2": 545.115, "r_y2": 632.713, "r_x3": 308.862, "r_y3": 632.713, "coord_origin": "TOPLEFT"}, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.22, "r_x1": 365.858, "r_y1": 653.22, "r_x2": 365.858, "r_y2": 644.668, "r_x3": 308.862, "r_y3": 644.668, "coord_origin": "TOPLEFT"}, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 701.901, "r_x1": 545.109, "r_y1": 701.901, "r_x2": 545.109, "r_y2": 694.204, "r_x3": 328.785, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 545.113, "r_y1": 712.86, "r_x2": 545.113, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 21, "label": "list_item", "bbox": {"l": 53.286, "t": 78.995, "r": 499.556, "b": 86.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.541211724281311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "section_header", "bbox": {"l": 53.812, "t": 94.58900000000006, "r": 284.346, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.46452972292900085, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "section_header", "bbox": {"l": 304.831, "t": 94.58900000000006, "r": 431.091, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.4629225730895996, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "caption", "bbox": {"l": 53.812, "t": 208.54100000000005, "r": 385.934, "b": 216.02300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.5986505746841431, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "caption", "bbox": {"l": 380.427, "t": 292.551, "r": 549.422, "b": 298.536, "coord_origin": "TOPLEFT"}, "confidence": 0.7499915957450867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 321.146, "r": 86.864, "b": 329.698, "coord_origin": "TOPLEFT"}, "confidence": 0.9140303134918213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "caption", "bbox": {"l": 62.595, "t": 458.997, "r": 98.849, "b": 467.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9153602719306946, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "section_header", "bbox": {"l": 308.862, "t": 490.709, "r": 460.848, "b": 501.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9436525702476501, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work & Conclusion", "orig": "6. Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "section_header", "bbox": {"l": 50.112, "t": 491.395, "r": 163.756, "b": 501.247, "coord_origin": "TOPLEFT"}, "confidence": 0.9561247229576111, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 513.162, "r": 545.115, "b": 521.7139999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9875594973564148, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 537.142, "r": 118.505, "b": 545.694, "coord_origin": "TOPLEFT"}, "confidence": 0.9852361679077148, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "section_header", "bbox": {"l": 308.862, "t": 672.099, "r": 364.406, "b": 682.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9442470073699951, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 313.345, "t": 694.204, "r": 323.8, "b": 701.901, "coord_origin": "TOPLEFT"}, "confidence": 0.8318753838539124, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8709858059883118, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "picture", "bbox": {"l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT"}, "confidence": 0.7699173092842102, "cells": [], "children": []}, {"id": 14, "label": "picture", "bbox": {"l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT"}, "confidence": 0.7873926162719727, "cells": [], "children": []}, {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [], "children": []}, {"id": 11, "label": "picture", "bbox": {"l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT"}, "confidence": 0.8308426737785339, "cells": [], "children": []}, {"id": 12, "label": "picture", "bbox": {"l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT"}, "confidence": 0.805853009223938, "cells": [], "children": []}, {"id": 13, "label": "picture", "bbox": {"l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT"}, "confidence": 0.7881615161895752, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"7": {"label": "table", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "8": {"label": "table", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "list_item", "id": 21, "page_no": 7, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 53.286, "t": 78.995, "r": 499.556, "b": 86.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.541211724281311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"}, {"label": "section_header", "id": 29, "page_no": 7, "cluster": {"id": 29, "label": "section_header", "bbox": {"l": 53.812, "t": 94.58900000000006, "r": 284.346, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.46452972292900085, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Japanese language (previously unseen by TableFormer):"}, {"label": "section_header", "id": 31, "page_no": 7, "cluster": {"id": 31, "label": "section_header", "bbox": {"l": 304.831, "t": 94.58900000000006, "r": 431.091, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.4629225730895996, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Example table from FinTabNet:"}, {"label": "caption", "id": 18, "page_no": 7, "cluster": {"id": 18, "label": "caption", "bbox": {"l": 53.812, "t": 208.54100000000005, "r": 385.934, "b": 216.02300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.5986505746841431, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"}, {"label": "caption", "id": 16, "page_no": 7, "cluster": {"id": 16, "label": "caption", "bbox": {"l": 380.427, "t": 292.551, "r": 549.422, "b": 298.536, "coord_origin": "TOPLEFT"}, "confidence": 0.7499915957450867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Text is aligned to match original for ease of viewing"}, {"label": "caption", "id": 6, "page_no": 7, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 321.146, "r": 86.864, "b": 329.698, "coord_origin": "TOPLEFT"}, "confidence": 0.9140303134918213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 5:"}, {"label": "caption", "id": 5, "page_no": 7, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 62.595, "t": 458.997, "r": 98.849, "b": 467.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9153602719306946, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 6:"}, {"label": "section_header", "id": 4, "page_no": 7, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 308.862, "t": 490.709, "r": 460.848, "b": 501.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9436525702476501, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work & Conclusion", "orig": "6. Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Future Work & Conclusion"}, {"label": "section_header", "id": 2, "page_no": 7, "cluster": {"id": 2, "label": "section_header", "bbox": {"l": 50.112, "t": 491.395, "r": 163.756, "b": 501.247, "coord_origin": "TOPLEFT"}, "confidence": 0.9561247229576111, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.5. Qualitative Analysis"}, {"label": "text", "id": 0, "page_no": 7, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 513.162, "r": 545.115, "b": 521.7139999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9875594973564148, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we presented TableFormer an end-to-end"}, {"label": "text", "id": 1, "page_no": 7, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 537.142, "r": 118.505, "b": 545.694, "coord_origin": "TOPLEFT"}, "confidence": 0.9852361679077148, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We showcase"}, {"label": "section_header", "id": 3, "page_no": 7, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 308.862, "t": 672.099, "r": 364.406, "b": 682.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9442470073699951, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "References"}, {"label": "list_item", "id": 10, "page_no": 7, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 313.345, "t": 694.204, "r": 323.8, "b": 701.901, "coord_origin": "TOPLEFT"}, "confidence": 0.8318753838539124, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[1]"}, {"label": "page_footer", "id": 9, "page_no": 7, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8709858059883118, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8"}, {"label": "picture", "id": 15, "page_no": 7, "cluster": {"id": 15, "label": "picture", "bbox": {"l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT"}, "confidence": 0.7699173092842102, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 14, "page_no": 7, "cluster": {"id": 14, "label": "picture", "bbox": {"l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT"}, "confidence": 0.7873926162719727, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 11, "page_no": 7, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT"}, "confidence": 0.8308426737785339, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 12, "page_no": 7, "cluster": {"id": 12, "label": "picture", "bbox": {"l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT"}, "confidence": 0.805853009223938, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 13, "page_no": 7, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT"}, "confidence": 0.7881615161895752, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "list_item", "id": 21, "page_no": 7, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 53.286, "t": 78.995, "r": 499.556, "b": 86.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.541211724281311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"}, {"label": "section_header", "id": 29, "page_no": 7, "cluster": {"id": 29, "label": "section_header", "bbox": {"l": 53.812, "t": 94.58900000000006, "r": 284.346, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.46452972292900085, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Japanese language (previously unseen by TableFormer):"}, {"label": "section_header", "id": 31, "page_no": 7, "cluster": {"id": 31, "label": "section_header", "bbox": {"l": 304.831, "t": 94.58900000000006, "r": 431.091, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.4629225730895996, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Example table from FinTabNet:"}, {"label": "caption", "id": 18, "page_no": 7, "cluster": {"id": 18, "label": "caption", "bbox": {"l": 53.812, "t": 208.54100000000005, "r": 385.934, "b": 216.02300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.5986505746841431, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"}, {"label": "caption", "id": 16, "page_no": 7, "cluster": {"id": 16, "label": "caption", "bbox": {"l": 380.427, "t": 292.551, "r": 549.422, "b": 298.536, "coord_origin": "TOPLEFT"}, "confidence": 0.7499915957450867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Text is aligned to match original for ease of viewing"}, {"label": "caption", "id": 6, "page_no": 7, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 321.146, "r": 86.864, "b": 329.698, "coord_origin": "TOPLEFT"}, "confidence": 0.9140303134918213, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 5:"}, {"label": "caption", "id": 5, "page_no": 7, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 62.595, "t": 458.997, "r": 98.849, "b": 467.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9153602719306946, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 6:"}, {"label": "section_header", "id": 4, "page_no": 7, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 308.862, "t": 490.709, "r": 460.848, "b": 501.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9436525702476501, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work & Conclusion", "orig": "6. Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Future Work & Conclusion"}, {"label": "section_header", "id": 2, "page_no": 7, "cluster": {"id": 2, "label": "section_header", "bbox": {"l": 50.112, "t": 491.395, "r": 163.756, "b": 501.247, "coord_origin": "TOPLEFT"}, "confidence": 0.9561247229576111, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.5. Qualitative Analysis"}, {"label": "text", "id": 0, "page_no": 7, "cluster": {"id": 0, "label": "text", "bbox": {"l": 320.817, "t": 513.162, "r": 545.115, "b": 521.7139999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9875594973564148, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we presented TableFormer an end-to-end"}, {"label": "text", "id": 1, "page_no": 7, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 537.142, "r": 118.505, "b": 545.694, "coord_origin": "TOPLEFT"}, "confidence": 0.9852361679077148, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We showcase"}, {"label": "section_header", "id": 3, "page_no": 7, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 308.862, "t": 672.099, "r": 364.406, "b": 682.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9442470073699951, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "References"}, {"label": "list_item", "id": 10, "page_no": 7, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 313.345, "t": 694.204, "r": 323.8, "b": 701.901, "coord_origin": "TOPLEFT"}, "confidence": 0.8318753838539124, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[1]"}, {"label": "picture", "id": 15, "page_no": 7, "cluster": {"id": 15, "label": "picture", "bbox": {"l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT"}, "confidence": 0.7699173092842102, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 14, "page_no": 7, "cluster": {"id": 14, "label": "picture", "bbox": {"l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT"}, "confidence": 0.7873926162719727, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 11, "page_no": 7, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT"}, "confidence": 0.8308426737785339, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 12, "page_no": 7, "cluster": {"id": 12, "label": "picture", "bbox": {"l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT"}, "confidence": 0.805853009223938, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 13, "page_no": 7, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT"}, "confidence": 0.7881615161895752, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 9, "page_no": 7, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8709858059883118, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8"}]}}, {"page_no": 8, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.313, "r_y0": 83.82299999999998, "r_x1": 286.363, "r_y1": 83.82299999999998, "r_x2": 286.363, "r_y2": 76.12599999999998, "r_x3": 217.313, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi,", "orig": "In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 286.363, "r_y1": 94.78200000000004, "r_x2": 286.363, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 105.74000000000001, "r_x1": 85.722, "r_y1": 105.74000000000001, "r_x2": 85.722, "r_y2": 98.043, "r_x3": 70.031, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.889, "r_y0": 105.61099999999999, "r_x1": 199.933, "r_y1": 105.61099999999999, "r_x2": 199.933, "r_y2": 97.88099999999997, "r_x3": 87.889, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.936, "r_y0": 105.74000000000001, "r_x1": 286.363, "r_y1": 105.74000000000001, "r_x2": 286.363, "r_y2": 98.043, "r_x3": 199.936, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 116.69899999999996, "r_x1": 221.949, "r_y1": 116.69899999999996, "r_x2": 221.949, "r_y2": 109.00199999999995, "r_x3": 70.031, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 127.971, "r_x1": 286.359, "r_y1": 127.971, "r_x2": 286.359, "r_y2": 120.274, "r_x3": 70.035, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.92999999999995, "r_x1": 179.672, "r_y1": 138.92999999999995, "r_x2": 179.672, "r_y2": 131.23299999999995, "r_x3": 70.031, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.581, "r_y0": 138.92999999999995, "r_x1": 286.363, "r_y1": 138.92999999999995, "r_x2": 286.363, "r_y2": 131.23299999999995, "r_x3": 185.581, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.889, "r_x1": 113.115, "r_y1": 149.889, "r_x2": 113.115, "r_y2": 142.192, "r_x3": 70.031, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.342, "r_y0": 149.76, "r_x1": 235.308, "r_y1": 149.76, "r_x2": 235.308, "r_y2": 142.02999999999997, "r_x3": 116.342, "r_y3": 142.02999999999997, "coord_origin": "TOPLEFT"}, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.307, "r_y0": 149.889, "r_x1": 267.676, "r_y1": 149.889, "r_x2": 267.676, "r_y2": 142.192, "r_x3": 235.307, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 161.16099999999994, "r_x1": 218.779, "r_y1": 161.16099999999994, "r_x2": 218.779, "r_y2": 153.46400000000006, "r_x3": 70.035, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.98, "r_y0": 161.03200000000004, "r_x1": 286.363, "r_y1": 161.03200000000004, "r_x2": 286.363, "r_y2": 153.30200000000002, "r_x3": 220.98, "r_y3": 153.30200000000002, "coord_origin": "TOPLEFT"}, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 171.99099999999999, "r_x1": 125.264, "r_y1": 171.99099999999999, "r_x2": 125.264, "r_y2": 164.26099999999997, "r_x3": 70.031, "r_y3": 164.26099999999997, "coord_origin": "TOPLEFT"}, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.261, "r_y0": 172.12, "r_x1": 127.503, "r_y1": 172.12, "r_x2": 127.503, "r_y2": 164.423, "r_x3": 125.261, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.986, "r_y0": 172.12, "r_x1": 286.36, "r_y1": 172.12, "r_x2": 286.36, "r_y2": 164.423, "r_x3": 129.986, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": "pages 647-677. Springer London, London,", "orig": "pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.07799999999997, "r_x1": 97.917, "r_y1": 183.07799999999997, "r_x2": 97.917, "r_y2": 175.38099999999997, "r_x3": 70.031, "r_y3": 175.38099999999997, "coord_origin": "TOPLEFT"}, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 194.35000000000002, "r_x1": 91.936, "r_y1": 194.35000000000002, "r_x2": 91.936, "r_y2": 186.65300000000002, "r_x3": 70.035, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Herv\u00b4 e", "orig": "Herv\u00b4 e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.101, "r_y0": 194.35000000000002, "r_x1": 124.736, "r_y1": 194.35000000000002, "r_x2": 124.736, "r_y2": 186.65300000000002, "r_x3": 97.101, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "D\u00b4 ejean,", "orig": "D\u00b4 ejean,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.636, "r_y0": 194.35000000000002, "r_x1": 163.497, "r_y1": 194.35000000000002, "r_x2": 163.497, "r_y2": 186.65300000000002, "r_x3": 130.636, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Jean-Luc", "orig": "Jean-Luc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.662, "r_y0": 194.35000000000002, "r_x1": 200.923, "r_y1": 194.35000000000002, "r_x2": 200.923, "r_y2": 186.65300000000002, "r_x3": 168.662, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Meunier,", "orig": "Meunier,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.814, "r_y0": 194.35000000000002, "r_x1": 238.188, "r_y1": 194.35000000000002, "r_x2": 238.188, "r_y2": 186.65300000000002, "r_x3": 206.814, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Liangcai", "orig": "Liangcai", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.352, "r_y0": 194.35000000000002, "r_x1": 260.532, "r_y1": 194.35000000000002, "r_x2": 260.532, "r_y2": 186.65300000000002, "r_x3": 243.352, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Gao,", "orig": "Gao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.432, "r_y0": 194.35000000000002, "r_x1": 286.364, "r_y1": 194.35000000000002, "r_x2": 286.364, "r_y2": 186.65300000000002, "r_x3": 266.432, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Yilun", "orig": "Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.30899999999997, "r_x1": 269.605, "r_y1": 205.30899999999997, "r_x2": 269.605, "r_y2": 197.61199999999997, "r_x3": 70.031, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.411, "r_y0": 205.30899999999997, "r_x1": 286.363, "r_y1": 205.30899999999997, "r_x2": 286.363, "r_y2": 197.61199999999997, "r_x3": 274.411, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "IC-", "orig": "IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 216.26800000000003, "r_x1": 286.363, "r_y1": 216.26800000000003, "r_x2": 286.363, "r_y2": 208.57100000000003, "r_x3": 70.031, "r_y3": 208.57100000000003, "coord_origin": "TOPLEFT"}, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.22699999999998, "r_x1": 245.835, "r_y1": 227.22699999999998, "r_x2": 245.835, "r_y2": 219.52999999999997, "r_x3": 70.031, "r_y3": 219.52999999999997, "coord_origin": "TOPLEFT"}, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.49900000000002, "r_x1": 286.359, "r_y1": 238.49900000000002, "r_x2": 286.359, "r_y2": 230.80200000000002, "r_x3": 70.035, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.45799999999997, "r_x1": 286.363, "r_y1": 249.45799999999997, "r_x2": 286.363, "r_y2": 241.76099999999997, "r_x3": 70.031, "r_y3": 241.76099999999997, "coord_origin": "TOPLEFT"}, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.41600000000005, "r_x1": 108.398, "r_y1": 260.41600000000005, "r_x2": 108.398, "r_y2": 252.71900000000005, "r_x3": 70.031, "r_y3": 252.71900000000005, "coord_origin": "TOPLEFT"}, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.645, "r_y0": 260.28700000000003, "r_x1": 286.36, "r_y1": 260.28700000000003, "r_x2": 286.36, "r_y2": 252.55700000000002, "r_x3": 110.645, "r_y3": 252.55700000000002, "coord_origin": "TOPLEFT"}, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.246, "r_x1": 140.579, "r_y1": 271.246, "r_x2": 140.579, "r_y2": 263.51599999999996, "r_x3": 70.031, "r_y3": 263.51599999999996, "coord_origin": "TOPLEFT"}, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.578, "r_y0": 271.375, "r_x1": 266.475, "r_y1": 271.375, "r_x2": 266.475, "r_y2": 263.678, "r_x3": 140.578, "r_y3": 263.678, "coord_origin": "TOPLEFT"}, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.647, "r_x1": 286.367, "r_y1": 282.647, "r_x2": 286.367, "r_y2": 274.95000000000005, "r_x3": 70.035, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "MaxG\u00a8 obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "MaxG\u00a8 obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.606, "r_x1": 179.574, "r_y1": 293.606, "r_x2": 179.574, "r_y2": 285.909, "r_x3": 70.031, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.016, "r_y0": 293.606, "r_x1": 194.485, "r_y1": 293.606, "r_x2": 194.485, "r_y2": 285.909, "r_x3": 187.016, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.044, "r_y0": 293.477, "r_x1": 286.363, "r_y1": 293.477, "r_x2": 286.363, "r_y2": 285.747, "r_x3": 198.044, "r_y3": 285.747, "coord_origin": "TOPLEFT"}, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.436, "r_x1": 260.199, "r_y1": 304.436, "r_x2": 260.199, "r_y2": 296.706, "r_x3": 70.031, "r_y3": 296.706, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.198, "r_y0": 304.565, "r_x1": 262.44, "r_y1": 304.565, "r_x2": 262.44, "r_y2": 296.868, "r_x3": 260.198, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.945, "r_y0": 304.565, "r_x1": 286.362, "r_y1": 304.565, "r_x2": 286.362, "r_y2": 296.868, "r_x3": 265.945, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.524, "r_x1": 142.749, "r_y1": 315.524, "r_x2": 142.749, "r_y2": 307.827, "r_x3": 70.031, "r_y3": 307.827, "coord_origin": "TOPLEFT"}, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 326.796, "r_x1": 199.492, "r_y1": 326.796, "r_x2": 199.492, "r_y2": 319.099, "r_x3": 70.035, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.988, "r_y0": 326.796, "r_x1": 286.359, "r_y1": 326.796, "r_x2": 286.359, "r_y2": 319.099, "r_x3": 206.988, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 337.754, "r_x1": 176.283, "r_y1": 337.754, "r_x2": 176.283, "r_y2": 330.057, "r_x3": 70.031, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.604, "r_y0": 337.754, "r_x1": 190.073, "r_y1": 337.754, "r_x2": 190.073, "r_y2": 330.057, "r_x3": 182.604, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.283, "r_y0": 337.625, "r_x1": 286.363, "r_y1": 337.625, "r_x2": 286.363, "r_y2": 329.895, "r_x3": 193.283, "r_y3": 329.895, "coord_origin": "TOPLEFT"}, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.584, "r_x1": 206.347, "r_y1": 348.584, "r_x2": 206.347, "r_y2": 340.854, "r_x3": 70.031, "r_y3": 340.854, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (SDAIR'95)", "orig": "Analysis and Recognition (SDAIR'95)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.346, "r_y0": 348.713, "r_x1": 274.822, "r_y1": 348.713, "r_x2": 274.822, "r_y2": 341.016, "r_x3": 206.346, "r_y3": 341.016, "coord_origin": "TOPLEFT"}, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 359.985, "r_x1": 286.359, "r_y1": 359.985, "r_x2": 286.359, "r_y2": 352.288, "r_x3": 70.035, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.944, "r_x1": 234.125, "r_y1": 370.944, "r_x2": 234.125, "r_y2": 363.247, "r_x3": 70.031, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.052, "r_y0": 370.944, "r_x1": 286.363, "r_y1": 370.944, "r_x2": 286.363, "r_y2": 363.247, "r_x3": 240.052, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.903, "r_x1": 85.973, "r_y1": 381.903, "r_x2": 85.973, "r_y2": 374.206, "r_x3": 70.031, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "tors:", "orig": "tors:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.349, "r_y0": 381.903, "r_x1": 286.363, "r_y1": 381.903, "r_x2": 286.363, "r_y2": 374.206, "r_x3": 90.349, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "Cascade network for table detection in document im-", "orig": "Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 392.862, "r_x1": 286.363, "r_y1": 392.862, "r_x2": 286.363, "r_y2": 385.165, "r_x3": 70.031, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 114.576, "r_y1": 403.821, "r_x2": 114.576, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.804, "r_y0": 403.692, "r_x1": 186.729, "r_y1": 403.692, "r_x2": 186.729, "r_y2": 395.962, "r_x3": 117.804, "r_y3": 395.962, "coord_origin": "TOPLEFT"}, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.728, "r_y0": 403.821, "r_x1": 243.001, "r_y1": 403.821, "r_x2": 243.001, "r_y2": 396.124, "r_x3": 186.728, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 415.092, "r_x1": 286.359, "r_y1": 415.092, "r_x2": 286.359, "r_y2": 407.395, "r_x3": 70.035, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 426.051, "r_x1": 147.133, "r_y1": 426.051, "r_x2": 147.133, "r_y2": 418.354, "r_x3": 70.031, "r_y3": 418.354, "coord_origin": "TOPLEFT"}, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.156, "r_y0": 425.922, "r_x1": 286.36, "r_y1": 425.922, "r_x2": 286.36, "r_y2": 418.192, "r_x3": 149.156, "r_y3": 418.192, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.881, "r_x1": 213.484, "r_y1": 436.881, "r_x2": 213.484, "r_y2": 429.151, "r_x3": 70.031, "r_y3": 429.151, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.483, "r_y0": 437.01, "r_x1": 261.041, "r_y1": 437.01, "r_x2": 261.041, "r_y2": 429.313, "r_x3": 213.483, "r_y3": 429.313, "coord_origin": "TOPLEFT"}, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 448.282, "r_x1": 286.359, "r_y1": 448.282, "r_x2": 286.359, "r_y2": 440.585, "r_x3": 70.035, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 459.241, "r_x1": 202.743, "r_y1": 459.241, "r_x2": 202.743, "r_y2": 451.544, "r_x3": 70.031, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.001, "r_y0": 459.241, "r_x1": 286.363, "r_y1": 459.241, "r_x2": 286.363, "r_y2": 451.544, "r_x3": 209.001, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's so-", "orig": "Pingan-vcgroup's so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 470.2, "r_x1": 286.363, "r_y1": 470.2, "r_x2": 286.363, "r_y2": 462.503, "r_x3": 70.031, "r_y3": 462.503, "coord_origin": "TOPLEFT"}, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 481.159, "r_x1": 141.87, "r_y1": 481.159, "r_x2": 141.87, "r_y2": 473.462, "r_x3": 70.031, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.097, "r_y0": 481.03, "r_x1": 166.016, "r_y1": 481.03, "r_x2": 166.016, "r_y2": 473.3, "r_x3": 145.097, "r_y3": 473.3, "coord_origin": "TOPLEFT"}, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.015, "r_y0": 481.159, "r_x1": 259.902, "r_y1": 481.159, "r_x2": 259.902, "r_y2": 473.462, "r_x3": 166.015, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 492.43, "r_x1": 117.091, "r_y1": 492.43, "r_x2": 117.091, "r_y2": 484.733, "r_x3": 70.035, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Jianying Hu,", "orig": "Jianying Hu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.054, "r_y0": 492.43, "r_x1": 286.359, "r_y1": 492.43, "r_x2": 286.359, "r_y2": 484.733, "r_x3": 121.054, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 503.389, "r_x1": 132.15, "r_y1": 503.389, "r_x2": 132.15, "r_y2": 495.692, "r_x3": 70.031, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Gordon Wilfong.", "orig": "Gordon Wilfong.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.691, "r_y0": 503.389, "r_x1": 273.362, "r_y1": 503.389, "r_x2": 273.362, "r_y2": 495.692, "r_x3": 137.691, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Medium-independent table detection.", "orig": "Medium-independent table detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 503.389, "r_x1": 286.363, "r_y1": 503.389, "r_x2": 286.363, "r_y2": 495.692, "r_x3": 278.894, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 514.219, "r_x1": 106.883, "r_y1": 514.219, "r_x2": 106.883, "r_y2": 506.489, "r_x3": 70.031, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Document", "orig": "Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 111.796, "r_y0": 514.219, "r_x1": 155.041, "r_y1": 514.219, "r_x2": 155.041, "r_y2": 506.489, "r_x3": 111.796, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.946, "r_y0": 514.219, "r_x1": 173.396, "r_y1": 514.219, "r_x2": 173.396, "r_y2": 506.489, "r_x3": 159.946, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.309, "r_y0": 514.219, "r_x1": 211.046, "r_y1": 514.219, "r_x2": 211.046, "r_y2": 506.489, "r_x3": 178.309, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Retrieval", "orig": "Retrieval", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.959, "r_y0": 514.219, "r_x1": 227.409, "r_y1": 514.219, "r_x2": 227.409, "r_y2": 506.489, "r_x3": 215.959, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "VII", "orig": "VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.405, "r_y0": 514.348, "r_x1": 229.647, "r_y1": 514.348, "r_x2": 229.647, "r_y2": 506.651, "r_x3": 227.405, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.56, "r_y0": 514.348, "r_x1": 261.28, "r_y1": 514.348, "r_x2": 261.28, "r_y2": 506.651, "r_x3": 234.56, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "volume", "orig": "volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.185, "r_y0": 514.348, "r_x1": 286.359, "r_y1": 514.348, "r_x2": 286.359, "r_y2": 506.651, "r_x3": 266.185, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "3967,", "orig": "3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.307, "r_x1": 286.363, "r_y1": 525.307, "r_x2": 286.363, "r_y2": 517.61, "r_x3": 70.031, "r_y3": 517.61, "coord_origin": "TOPLEFT"}, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 536.266, "r_x1": 112.361, "r_y1": 536.266, "r_x2": 112.361, "r_y2": 528.569, "r_x3": 70.031, "r_y3": 528.569, "coord_origin": "TOPLEFT"}, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 547.538, "r_x1": 126.407, "r_y1": 547.538, "r_x2": 126.407, "r_y2": 539.841, "r_x3": 70.035, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "Matthew Hurst.", "orig": "Matthew Hurst.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.648, "r_y0": 547.538, "r_x1": 286.359, "r_y1": 547.538, "r_x2": 286.359, "r_y2": 539.841, "r_x3": 130.648, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "A constraint-based approach to table struc-", "orig": "A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 558.4970000000001, "r_x1": 124.654, "r_y1": 558.4970000000001, "r_x2": 124.654, "r_y2": 550.8, "r_x3": 70.031, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "ture derivation.", "orig": "ture derivation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.815, "r_y0": 558.4970000000001, "r_x1": 136.284, "r_y1": 558.4970000000001, "r_x2": 136.284, "r_y2": 550.8, "r_x3": 128.815, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.811, "r_y0": 558.3679999999999, "r_x1": 286.362, "r_y1": 558.3679999999999, "r_x2": 286.362, "r_y2": 550.638, "r_x3": 138.811, "r_y3": 550.638, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.327, "r_x1": 286.363, "r_y1": 569.327, "r_x2": 286.363, "r_y2": 561.597, "r_x3": 70.031, "r_y3": 561.597, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.2860000000001, "r_x1": 74.514, "r_y1": 580.2860000000001, "r_x2": 74.514, "r_y2": 572.556, "r_x3": 70.031, "r_y3": 572.556, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.514, "r_y0": 580.415, "r_x1": 76.756, "r_y1": 580.415, "r_x2": 76.756, "r_y2": 572.718, "r_x3": 74.514, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.06, "r_y0": 580.415, "r_x1": 286.363, "r_y1": 580.415, "r_x2": 286.363, "r_y2": 572.718, "r_x3": 79.06, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "orig": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.373, "r_x1": 82.647, "r_y1": 591.373, "r_x2": 82.647, "r_y2": 583.6759999999999, "r_x3": 70.031, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "ety.", "orig": "ety.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.875, "r_y0": 591.373, "r_x1": 90.358, "r_y1": 591.373, "r_x2": 90.358, "r_y2": 583.6759999999999, "r_x3": 85.875, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.645, "r_x1": 116.302, "r_y1": 602.645, "r_x2": 116.302, "r_y2": 594.948, "r_x3": 70.035, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Thotreingam", "orig": "Thotreingam", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.368, "r_y0": 602.645, "r_x1": 144.161, "r_y1": 602.645, "r_x2": 144.161, "r_y2": 594.948, "r_x3": 121.368, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Kasar,", "orig": "Kasar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.926, "r_y0": 602.645, "r_x1": 186.796, "r_y1": 602.645, "r_x2": 186.796, "r_y2": 594.948, "r_x3": 149.926, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Philippine", "orig": "Philippine", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.862, "r_y0": 602.645, "r_x1": 217.013, "r_y1": 602.645, "r_x2": 217.013, "r_y2": 594.948, "r_x3": 191.862, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Barlas,", "orig": "Barlas,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.778, "r_y0": 602.645, "r_x1": 257.146, "r_y1": 602.645, "r_x2": 257.146, "r_y2": 594.948, "r_x3": 222.778, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Sebastien", "orig": "Sebastien", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.203, "r_y0": 602.645, "r_x1": 286.359, "r_y1": 602.645, "r_x2": 286.359, "r_y2": 594.948, "r_x3": 262.203, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Adam,", "orig": "Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.604, "r_x1": 214.838, "r_y1": 613.604, "r_x2": 214.838, "r_y2": 605.907, "r_x3": 70.031, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Cl\u00b4 ement Chatelain, and Thierry Paquet.", "orig": "Cl\u00b4 ement Chatelain, and Thierry Paquet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.949, "r_y0": 613.604, "r_x1": 286.363, "r_y1": 613.604, "r_x2": 286.363, "r_y2": 605.907, "r_x3": 219.949, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Learning to detect", "orig": "Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.563, "r_x1": 286.363, "r_y1": 624.563, "r_x2": 286.363, "r_y2": 616.866, "r_x3": 70.031, "r_y3": 616.866, "coord_origin": "TOPLEFT"}, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.5219999999999, "r_x1": 77.5, "r_y1": 635.5219999999999, "r_x2": 77.5, "r_y2": 627.825, "r_x3": 70.031, "r_y3": 627.825, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.92, "r_y0": 635.393, "r_x1": 286.362, "r_y1": 635.393, "r_x2": 286.362, "r_y2": 627.663, "r_x3": 79.92, "r_y3": 627.663, "coord_origin": "TOPLEFT"}, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 646.352, "r_x1": 140.677, "r_y1": 646.352, "r_x2": 140.677, "r_y2": 638.6220000000001, "r_x3": 70.031, "r_y3": 638.6220000000001, "coord_origin": "TOPLEFT"}, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.676, "r_y0": 646.481, "r_x1": 264.439, "r_y1": 646.481, "r_x2": 264.439, "r_y2": 638.784, "r_x3": 140.676, "r_y3": 638.784, "coord_origin": "TOPLEFT"}, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 657.7529999999999, "r_x1": 91.447, "r_y1": 657.7529999999999, "r_x2": 91.447, "r_y2": 650.056, "r_x3": 70.035, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Pratik", "orig": "Pratik", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.092, "r_y0": 657.7529999999999, "r_x1": 119.745, "r_y1": 657.7529999999999, "r_x2": 119.745, "r_y2": 650.056, "r_x3": 96.092, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Kayal,", "orig": "Kayal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.99, "r_y0": 657.7529999999999, "r_x1": 149.397, "r_y1": 657.7529999999999, "r_x2": 149.397, "r_y2": 650.056, "r_x3": 124.99, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mrinal", "orig": "Mrinal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.042, "r_y0": 657.7529999999999, "r_x1": 180.188, "r_y1": 657.7529999999999, "r_x2": 180.188, "r_y2": 650.056, "r_x3": 154.042, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Anand,", "orig": "Anand,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.433, "r_y0": 657.7529999999999, "r_x1": 206.845, "r_y1": 657.7529999999999, "r_x2": 206.845, "r_y2": 650.056, "r_x3": 185.433, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Harsh", "orig": "Harsh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.489, "r_y0": 657.7529999999999, "r_x1": 234.147, "r_y1": 657.7529999999999, "r_x2": 234.147, "r_y2": 650.056, "r_x3": 211.489, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Desai,", "orig": "Desai,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.393, "r_y0": 657.7529999999999, "r_x1": 252.34, "r_y1": 657.7529999999999, "r_x2": 252.34, "r_y2": 650.056, "r_x3": 239.393, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.976, "r_y0": 657.7529999999999, "r_x1": 286.359, "r_y1": 657.7529999999999, "r_x2": 286.359, "r_y2": 650.056, "r_x3": 256.976, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mayank", "orig": "Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.711, "r_x1": 93.2, "r_y1": 668.711, "r_x2": 93.2, "r_y2": 661.014, "r_x3": 70.031, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.202, "r_y0": 668.711, "r_x1": 120.619, "r_y1": 668.711, "r_x2": 120.619, "r_y2": 661.014, "r_x3": 102.202, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Icdar", "orig": "Icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.672, "r_y0": 668.711, "r_x1": 238.922, "r_y1": 668.711, "r_x2": 238.922, "r_y2": 661.014, "r_x3": 124.672, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "2021 competition on scientific", "orig": "2021 competition on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.975, "r_y0": 668.711, "r_x1": 260.406, "r_y1": 668.711, "r_x2": 260.406, "r_y2": 661.014, "r_x3": 242.975, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.449, "r_y0": 668.711, "r_x1": 286.363, "r_y1": 668.711, "r_x2": 286.363, "r_y2": 661.014, "r_x3": 264.449, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.67, "r_x1": 171.997, "r_y1": 679.67, "r_x2": 171.997, "r_y2": 671.973, "r_x3": 70.031, "r_y3": 671.973, "coord_origin": "TOPLEFT"}, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 690.942, "r_x1": 130.612, "r_y1": 690.942, "r_x2": 130.612, "r_y2": 683.245, "r_x3": 70.035, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Harold W Kuhn.", "orig": "Harold W Kuhn.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.97, "r_y0": 690.942, "r_x1": 286.359, "r_y1": 690.942, "r_x2": 286.359, "r_y2": 683.245, "r_x3": 134.97, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "The hungarian method for the assignment", "orig": "The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 701.901, "r_x1": 102.158, "r_y1": 701.901, "r_x2": 102.158, "r_y2": 694.204, "r_x3": 70.031, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 107.55, "r_y0": 701.772, "r_x1": 231.475, "r_y1": 701.772, "r_x2": 231.475, "r_y2": 694.042, "r_x3": 107.55, "r_y3": 694.042, "coord_origin": "TOPLEFT"}, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.476, "r_y0": 701.901, "r_x1": 233.718, "r_y1": 701.901, "r_x2": 233.718, "r_y2": 694.204, "r_x3": 231.476, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.802, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 236.802, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "2(1-2):83-97,", "orig": "2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 97.917, "r_y1": 712.86, "r_x2": 97.917, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 83.82299999999998, "r_x1": 351.192, "r_y1": 83.82299999999998, "r_x2": 351.192, "r_y2": 76.12599999999998, "r_x3": 328.785, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Girish", "orig": "Girish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.308, "r_y0": 83.82299999999998, "r_x1": 389.291, "r_y1": 83.82299999999998, "r_x2": 389.291, "r_y2": 76.12599999999998, "r_x3": 355.308, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Kulkarni,", "orig": "Kulkarni,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.863, "r_y0": 83.82299999999998, "r_x1": 420.225, "r_y1": 83.82299999999998, "r_x2": 420.225, "r_y2": 76.12599999999998, "r_x3": 393.863, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Visruth", "orig": "Visruth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.331, "r_y0": 83.82299999999998, "r_x1": 454.961, "r_y1": 83.82299999999998, "r_x2": 454.961, "r_y2": 76.12599999999998, "r_x3": 424.331, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Premraj,", "orig": "Premraj,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.533, "r_y0": 83.82299999999998, "r_x1": 486.881, "r_y1": 83.82299999999998, "r_x2": 486.881, "r_y2": 76.12599999999998, "r_x3": 459.533, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Vicente", "orig": "Vicente", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.988, "r_y0": 83.82299999999998, "r_x1": 524.1, "r_y1": 83.82299999999998, "r_x2": 524.1, "r_y2": 76.12599999999998, "r_x3": 490.988, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Ordonez,", "orig": "Ordonez,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.673, "r_y0": 83.82299999999998, "r_x1": 545.109, "r_y1": 83.82299999999998, "r_x2": 545.109, "r_y2": 76.12599999999998, "r_x3": 528.673, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Sag-", "orig": "Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 545.113, "r_y1": 94.78099999999995, "r_x2": 545.113, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.74000000000001, "r_x1": 390.963, "r_y1": 105.74000000000001, "r_x2": 390.963, "r_y2": 98.043, "r_x3": 328.781, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.27, "r_y0": 105.74000000000001, "r_x1": 435.14, "r_y1": 105.74000000000001, "r_x2": 435.14, "r_y2": 98.043, "r_x3": 400.27, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.713, "r_y0": 105.74000000000001, "r_x1": 494.507, "r_y1": 105.74000000000001, "r_x2": 494.507, "r_y2": 98.043, "r_x3": 441.713, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Understanding", "orig": "Understanding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.649, "r_y0": 105.74000000000001, "r_x1": 545.113, "r_y1": 105.74000000000001, "r_x2": 545.113, "r_y2": 98.043, "r_x3": 498.649, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "and generat-", "orig": "and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 440.807, "r_y1": 116.69899999999996, "r_x2": 440.807, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.635, "r_y0": 116.57000000000005, "r_x1": 545.113, "r_y1": 116.57000000000005, "r_x2": 545.113, "r_y2": 108.84000000000003, "r_x3": 446.635, "r_y3": 108.84000000000003, "coord_origin": "TOPLEFT"}, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 127.529, "r_x1": 471.132, "r_y1": 127.529, "r_x2": 471.132, "r_y2": 119.79899999999998, "r_x3": 328.781, "r_y3": 119.79899999999998, "coord_origin": "TOPLEFT"}, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.133, "r_y0": 127.65800000000002, "r_x1": 473.375, "r_y1": 127.65800000000002, "r_x2": 473.375, "r_y2": 119.96100000000001, "r_x3": 471.133, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.127, "r_y0": 127.65800000000002, "r_x1": 545.115, "r_y1": 127.65800000000002, "r_x2": 545.115, "r_y2": 119.96100000000001, "r_x3": 476.127, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": "35(12):2891-2903,", "orig": "35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 138.61699999999996, "r_x1": 356.667, "r_y1": 138.61699999999996, "r_x2": 356.667, "r_y2": 130.91999999999996, "r_x3": 328.781, "r_y3": 130.91999999999996, "coord_origin": "TOPLEFT"}, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 150.063, "r_x1": 375.698, "r_y1": 150.063, "r_x2": 375.698, "r_y2": 142.36599999999999, "r_x3": 328.785, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Minghao Li,", "orig": "Minghao Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.557, "r_y0": 150.063, "r_x1": 392.51, "r_y1": 150.063, "r_x2": 392.51, "r_y2": 142.36599999999999, "r_x3": 380.557, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Lei", "orig": "Lei", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.84, "r_y0": 150.063, "r_x1": 412.038, "r_y1": 150.063, "r_x2": 412.038, "r_y2": 142.36599999999999, "r_x3": 396.84, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Cui,", "orig": "Cui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.889, "r_y0": 150.063, "r_x1": 478.246, "r_y1": 150.063, "r_x2": 478.246, "r_y2": 142.36599999999999, "r_x3": 416.889, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Shaohan Huang,", "orig": "Shaohan Huang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.097, "r_y0": 150.063, "r_x1": 500.035, "r_y1": 150.063, "r_x2": 500.035, "r_y2": 142.36599999999999, "r_x3": 483.097, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Furu", "orig": "Furu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.365, "r_y0": 150.063, "r_x1": 520.828, "r_y1": 150.063, "r_x2": 520.828, "r_y2": 142.36599999999999, "r_x3": 504.365, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Wei,", "orig": "Wei,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 525.679, "r_y0": 150.063, "r_x1": 545.109, "r_y1": 150.063, "r_x2": 545.109, "r_y2": 142.36599999999999, "r_x3": 525.679, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Ming", "orig": "Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.02099999999996, "r_x1": 414.446, "r_y1": 161.02099999999996, "r_x2": 414.446, "r_y2": 153.32399999999996, "r_x3": 328.781, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 421.825, "r_y0": 161.02099999999996, "r_x1": 461.448, "r_y1": 161.02099999999996, "r_x2": 461.448, "r_y2": 153.32399999999996, "r_x3": 421.825, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Tablebank:", "orig": "Tablebank:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.828, "r_y0": 161.02099999999996, "r_x1": 545.113, "r_y1": 161.02099999999996, "r_x2": 545.113, "r_y2": 153.32399999999996, "r_x3": 466.828, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "A benchmark dataset", "orig": "A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 171.98000000000002, "r_x1": 493.628, "r_y1": 171.98000000000002, "r_x2": 493.628, "r_y2": 164.28300000000002, "r_x3": 328.781, "r_y3": 164.28300000000002, "coord_origin": "TOPLEFT"}, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 183.42600000000004, "r_x1": 545.109, "r_y1": 183.42600000000004, "r_x2": 545.109, "r_y2": 175.72900000000004, "r_x3": 328.785, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 194.385, "r_x1": 375.397, "r_y1": 194.385, "r_x2": 375.397, "r_y2": 186.688, "r_x3": 328.781, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Xianhui Liu.", "orig": "Xianhui Liu.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.154, "r_y0": 194.385, "r_x1": 399.58, "r_y1": 194.385, "r_x2": 399.58, "r_y2": 186.688, "r_x3": 381.154, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Gfte:", "orig": "Gfte:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.937, "r_y0": 194.385, "r_x1": 545.113, "r_y1": 194.385, "r_x2": 545.113, "r_y2": 186.688, "r_x3": 403.937, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Graph-based financial table extraction.", "orig": "Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 205.34400000000005, "r_x1": 545.113, "r_y1": 205.34400000000005, "r_x2": 545.113, "r_y2": 197.64700000000005, "r_x3": 328.781, "r_y3": 197.64700000000005, "coord_origin": "TOPLEFT"}, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 216.303, "r_x1": 545.113, "r_y1": 216.303, "r_x2": 545.113, "r_y2": 208.606, "r_x3": 328.781, "r_y3": 208.606, "coord_origin": "TOPLEFT"}, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 227.26199999999994, "r_x1": 365.382, "r_y1": 227.26199999999994, "r_x2": 365.382, "r_y2": 219.56500000000005, "r_x3": 328.781, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "Escalante,", "orig": "Escalante,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.237, "r_y0": 227.26199999999994, "r_x1": 479.264, "r_y1": 227.26199999999994, "r_x2": 479.264, "r_y2": 219.56500000000005, "r_x3": 369.237, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "and Roberto Vezzani, editors,", "orig": "and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 227.13300000000004, "r_x1": 545.113, "r_y1": 227.13300000000004, "r_x2": 545.113, "r_y2": 219.40300000000002, "r_x3": 483.119, "r_y3": 219.40300000000002, "coord_origin": "TOPLEFT"}, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 238.091, "r_x1": 519.398, "r_y1": 238.091, "r_x2": 519.398, "r_y2": 230.361, "r_x3": 328.781, "r_y3": 230.361, "coord_origin": "TOPLEFT"}, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 519.401, "r_y0": 238.22000000000003, "r_x1": 521.643, "r_y1": 238.22000000000003, "r_x2": 521.643, "r_y2": 230.52300000000002, "r_x3": 519.401, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.691, "r_y0": 238.22000000000003, "r_x1": 545.108, "r_y1": 238.22000000000003, "r_x2": 545.108, "r_y2": 230.52300000000002, "r_x3": 524.691, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 249.17899999999997, "r_x1": 545.113, "r_y1": 249.17899999999997, "r_x2": 545.113, "r_y2": 241.48199999999997, "r_x3": 328.781, "r_y3": 241.48199999999997, "coord_origin": "TOPLEFT"}, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 260.13800000000003, "r_x1": 333.264, "r_y1": 260.13800000000003, "r_x2": 333.264, "r_y2": 252.44100000000003, "r_x3": 328.781, "r_y3": 252.44100000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 271.58399999999995, "r_x1": 545.109, "r_y1": 271.58399999999995, "r_x2": 545.109, "r_y2": 263.88699999999994, "r_x3": 328.785, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 282.543, "r_x1": 545.113, "r_y1": 282.543, "r_x2": 545.113, "r_y2": 274.846, "r_x3": 328.781, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 293.502, "r_x1": 527.118, "r_y1": 293.502, "r_x2": 527.118, "r_y2": 285.805, "r_x3": 328.781, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.664, "r_y0": 293.502, "r_x1": 545.113, "r_y1": 293.502, "r_x2": 545.113, "r_y2": 285.805, "r_x3": 531.664, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ro-", "orig": "Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 304.461, "r_x1": 343.549, "r_y1": 304.461, "r_x2": 343.549, "r_y2": 296.764, "r_x3": 328.781, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "bust", "orig": "bust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.44, "r_y0": 304.461, "r_x1": 545.113, "r_y1": 304.461, "r_x2": 545.113, "r_y2": 296.764, "r_x3": 347.44, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "pdf document conversion using recurrent neural net-", "orig": "pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 315.419, "r_x1": 352.847, "r_y1": 315.419, "r_x2": 352.847, "r_y2": 307.722, "r_x3": 328.781, "r_y3": 307.722, "coord_origin": "TOPLEFT"}, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.236, "r_y0": 315.29, "r_x1": 545.114, "r_y1": 315.29, "r_x2": 545.114, "r_y2": 307.56, "r_x3": 360.236, "r_y3": 307.56, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 326.249, "r_x1": 371.022, "r_y1": 326.249, "r_x2": 371.022, "r_y2": 318.519, "r_x3": 328.781, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.021, "r_y0": 326.378, "r_x1": 502.262, "r_y1": 326.378, "r_x2": 502.262, "r_y2": 318.681, "r_x3": 371.021, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 337.824, "r_x1": 545.109, "r_y1": 337.824, "r_x2": 545.109, "r_y2": 330.127, "r_x3": 328.785, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 348.783, "r_x1": 456.821, "r_y1": 348.783, "r_x2": 456.821, "r_y2": 341.086, "r_x3": 328.781, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Yongpan Wang, and Gui-Song Xia.", "orig": "Yongpan Wang, and Gui-Song Xia.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.991, "r_y0": 348.783, "r_x1": 545.113, "r_y1": 348.783, "r_x2": 545.113, "r_y2": 341.086, "r_x3": 460.991, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Parsing table structures", "orig": "Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 359.742, "r_x1": 370.421, "r_y1": 359.742, "r_x2": 370.421, "r_y2": 352.045, "r_x3": 328.781, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "in the wild.", "orig": "in the wild.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.308, "r_y0": 359.742, "r_x1": 382.777, "r_y1": 359.742, "r_x2": 382.777, "r_y2": 352.045, "r_x3": 375.308, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.541, "r_y0": 359.613, "r_x1": 545.116, "r_y1": 359.613, "r_x2": 545.116, "r_y2": 351.883, "r_x3": 385.541, "r_y3": 351.883, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 370.572, "r_x1": 443.596, "r_y1": 370.572, "r_x2": 443.596, "r_y2": 362.842, "r_x3": 328.781, "r_y3": 362.842, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 443.594, "r_y0": 370.701, "r_x1": 534.486, "r_y1": 370.701, "r_x2": 534.486, "r_y2": 363.004, "r_x3": 443.594, "r_y3": 363.004, "coord_origin": "TOPLEFT"}, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 382.146, "r_x1": 362.66, "r_y1": 382.146, "r_x2": 362.66, "r_y2": 374.449, "r_x3": 328.785, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.695, "r_y0": 382.146, "r_x1": 389.613, "r_y1": 382.146, "r_x2": 389.613, "r_y2": 374.449, "r_x3": 368.695, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.648, "r_y0": 382.146, "r_x1": 424.564, "r_y1": 382.146, "r_x2": 424.564, "r_y2": 374.449, "r_x3": 395.648, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.549, "r_y0": 382.146, "r_x1": 488.504, "r_y1": 382.146, "r_x2": 488.504, "r_y2": 374.449, "r_x3": 431.549, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "D Vishwanath,", "orig": "D Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.48, "r_y0": 382.146, "r_x1": 515.412, "r_y1": 382.146, "r_x2": 515.412, "r_y2": 374.449, "r_x3": 495.48, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 521.446, "r_y0": 382.146, "r_x1": 545.109, "r_y1": 382.146, "r_x2": 545.109, "r_y2": 374.449, "r_x3": 521.446, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 393.105, "r_x1": 460.318, "r_y1": 393.105, "r_x2": 460.318, "r_y2": 385.408, "r_x3": 328.781, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Monika Sharma, and Lovekesh Vig.", "orig": "Monika Sharma, and Lovekesh Vig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.393, "r_y0": 393.105, "r_x1": 498.542, "r_y1": 393.105, "r_x2": 498.542, "r_y2": 385.408, "r_x3": 465.393, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Tablenet:", "orig": "Tablenet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.469, "r_y0": 393.105, "r_x1": 545.113, "r_y1": 393.105, "r_x2": 545.113, "r_y2": 385.408, "r_x3": 502.469, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Deep learn-", "orig": "Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 404.064, "r_x1": 545.113, "r_y1": 404.064, "r_x2": 545.113, "r_y2": 396.367, "r_x3": 328.781, "r_y3": 396.367, "coord_origin": "TOPLEFT"}, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 415.023, "r_x1": 478.009, "r_y1": 415.023, "r_x2": 478.009, "r_y2": 407.326, "r_x3": 328.781, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 484.07, "r_y0": 415.023, "r_x1": 491.539, "r_y1": 415.023, "r_x2": 491.539, "r_y2": 407.326, "r_x3": 484.07, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.668, "r_y0": 414.894, "r_x1": 545.113, "r_y1": 414.894, "r_x2": 545.113, "r_y2": 407.164, "r_x3": 494.668, "r_y3": 407.164, "coord_origin": "TOPLEFT"}, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 425.853, "r_x1": 349.709, "r_y1": 425.853, "r_x2": 349.709, "r_y2": 418.123, "r_x3": 328.781, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "tional", "orig": "tional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.295, "r_y0": 425.853, "r_x1": 545.113, "r_y1": 425.853, "r_x2": 545.113, "r_y2": 418.123, "r_x3": 353.295, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 436.812, "r_x1": 360.836, "r_y1": 436.812, "r_x2": 360.836, "r_y2": 429.082, "r_x3": 328.781, "r_y3": 429.082, "coord_origin": "TOPLEFT"}, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.836, "r_y0": 436.941, "r_x1": 475.633, "r_y1": 436.941, "r_x2": 475.633, "r_y2": 429.244, "r_x3": 360.836, "r_y3": 429.244, "coord_origin": "TOPLEFT"}, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 448.386, "r_x1": 545.109, "r_y1": 448.386, "r_x2": 545.109, "r_y2": 440.689, "r_x3": 328.785, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 459.345, "r_x1": 545.113, "r_y1": 459.345, "r_x2": 545.113, "r_y2": 451.648, "r_x3": 328.781, "r_y3": 451.648, "coord_origin": "TOPLEFT"}, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 470.304, "r_x1": 343.477, "r_y1": 470.304, "r_x2": 343.477, "r_y2": 462.607, "r_x3": 328.781, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Lin,", "orig": "Lin,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.601, "r_y0": 470.304, "r_x1": 373.496, "r_y1": 470.304, "r_x2": 373.496, "r_y2": 462.607, "r_x3": 347.601, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Natalia", "orig": "Natalia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.244, "r_y0": 470.304, "r_x1": 420.83, "r_y1": 470.304, "r_x2": 420.83, "r_y2": 462.607, "r_x3": 377.244, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Gimelshein,", "orig": "Gimelshein,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.955, "r_y0": 470.304, "r_x1": 473.239, "r_y1": 470.304, "r_x2": 473.239, "r_y2": 462.607, "r_x3": 424.955, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Luca Antiga,", "orig": "Luca Antiga,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.363, "r_y0": 470.304, "r_x1": 545.113, "r_y1": 470.304, "r_x2": 545.113, "r_y2": 462.607, "r_x3": 477.363, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Alban Desmaison,", "orig": "Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 481.263, "r_x1": 545.113, "r_y1": 481.263, "r_x2": 545.113, "r_y2": 473.566, "r_x3": 328.781, "r_y3": 473.566, "coord_origin": "TOPLEFT"}, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 492.222, "r_x1": 545.113, "r_y1": 492.222, "r_x2": 545.113, "r_y2": 484.525, "r_x3": 328.781, "r_y3": 484.525, "coord_origin": "TOPLEFT"}, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 503.181, "r_x1": 545.113, "r_y1": 503.181, "r_x2": 545.113, "r_y2": 495.484, "r_x3": 328.781, "r_y3": 495.484, "coord_origin": "TOPLEFT"}, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 514.14, "r_x1": 545.113, "r_y1": 514.14, "r_x2": 545.113, "r_y2": 506.443, "r_x3": 328.781, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 525.0989999999999, "r_x1": 545.11, "r_y1": 525.0989999999999, "r_x2": 545.11, "r_y2": 517.402, "r_x3": 328.781, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4 e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4 e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 536.057, "r_x1": 434.567, "r_y1": 536.057, "r_x2": 434.567, "r_y2": 528.36, "r_x3": 328.781, "r_y3": 528.36, "coord_origin": "TOPLEFT"}, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.864, "r_y0": 535.928, "r_x1": 545.111, "r_y1": 535.928, "r_x2": 545.111, "r_y2": 528.198, "r_x3": 437.864, "r_y3": 528.198, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 546.887, "r_x1": 425.735, "r_y1": 546.887, "r_x2": 425.735, "r_y2": 539.157, "r_x3": 328.781, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.736, "r_y0": 547.016, "r_x1": 545.115, "r_y1": 547.016, "r_x2": 545.115, "r_y2": 539.319, "r_x3": 425.736, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 557.975, "r_x1": 399.741, "r_y1": 557.975, "r_x2": 399.741, "r_y2": 550.278, "r_x3": 328.781, "r_y3": 550.278, "coord_origin": "TOPLEFT"}, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 569.421, "r_x1": 395.433, "r_y1": 569.421, "r_x2": 395.433, "r_y2": 561.7239999999999, "r_x3": 328.785, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Devashish Prasad,", "orig": "Devashish Prasad,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.369, "r_y0": 569.421, "r_x1": 545.109, "r_y1": 569.421, "r_x2": 545.109, "r_y2": 561.7239999999999, "r_x3": 399.369, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 580.38, "r_x1": 545.113, "r_y1": 580.38, "r_x2": 545.113, "r_y2": 572.683, "r_x3": 328.781, "r_y3": 572.683, "coord_origin": "TOPLEFT"}, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 591.3389999999999, "r_x1": 545.113, "r_y1": 591.3389999999999, "r_x2": 545.113, "r_y2": 583.642, "r_x3": 328.781, "r_y3": 583.642, "coord_origin": "TOPLEFT"}, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 602.298, "r_x1": 418.266, "r_y1": 602.298, "r_x2": 418.266, "r_y2": 594.601, "r_x3": 328.781, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "image-based documents.", "orig": "image-based documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.148, "r_y0": 602.298, "r_x1": 431.617, "r_y1": 602.298, "r_x2": 431.617, "r_y2": 594.601, "r_x3": 424.148, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.691, "r_y0": 602.169, "r_x1": 545.112, "r_y1": 602.169, "r_x2": 545.112, "r_y2": 594.439, "r_x3": 434.691, "r_y3": 594.439, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 613.127, "r_x1": 369.784, "r_y1": 613.127, "r_x2": 369.784, "r_y2": 605.3969999999999, "r_x3": 328.781, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Conference", "orig": "Conference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.008, "r_y0": 613.127, "r_x1": 449.549, "r_y1": 613.127, "r_x2": 449.549, "r_y2": 605.3969999999999, "r_x3": 374.008, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "on Computer Vision", "orig": "on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.782, "r_y0": 613.127, "r_x1": 497.636, "r_y1": 613.127, "r_x2": 497.636, "r_y2": 605.3969999999999, "r_x3": 453.782, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "and Pattern", "orig": "and Pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.868, "r_y0": 613.127, "r_x1": 545.113, "r_y1": 613.127, "r_x2": 545.113, "r_y2": 605.3969999999999, "r_x3": 501.868, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 624.086, "r_x1": 367.803, "r_y1": 624.086, "r_x2": 367.803, "r_y2": 616.356, "r_x3": 328.781, "r_y3": 616.356, "coord_origin": "TOPLEFT"}, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.802, "r_y0": 624.215, "r_x1": 458.694, "r_y1": 624.215, "r_x2": 458.694, "r_y2": 616.518, "r_x3": 367.802, "r_y3": 616.518, "coord_origin": "TOPLEFT"}, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 635.6610000000001, "r_x1": 545.109, "r_y1": 635.6610000000001, "r_x2": 545.109, "r_y2": 627.9639999999999, "r_x3": 328.785, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 646.62, "r_x1": 545.113, "r_y1": 646.62, "r_x2": 545.113, "r_y2": 638.923, "r_x3": 328.781, "r_y3": 638.923, "coord_origin": "TOPLEFT"}, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 657.579, "r_x1": 336.25, "r_y1": 657.579, "r_x2": 336.25, "r_y2": 649.8820000000001, "r_x3": 328.781, "r_y3": 649.8820000000001, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.116, "r_y1": 657.45, "r_x2": 545.116, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 668.409, "r_x1": 406.322, "r_y1": 668.409, "r_x2": 406.322, "r_y2": 660.679, "r_x3": 328.781, "r_y3": 660.679, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 668.538, "r_x1": 521.119, "r_y1": 668.538, "r_x2": 521.119, "r_y2": 660.841, "r_x3": 406.322, "r_y3": 660.841, "coord_origin": "TOPLEFT"}, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 679.983, "r_x1": 400.857, "r_y1": 679.983, "r_x2": 400.857, "r_y2": 672.2860000000001, "r_x3": 328.785, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Hamid Rezatofighi,", "orig": "Hamid Rezatofighi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 405.403, "r_y0": 679.983, "r_x1": 453.571, "r_y1": 679.983, "r_x2": 453.571, "r_y2": 672.2860000000001, "r_x3": 405.403, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Nathan Tsoi,", "orig": "Nathan Tsoi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.117, "r_y0": 679.983, "r_x1": 521.635, "r_y1": 679.983, "r_x2": 521.635, "r_y2": 672.2860000000001, "r_x3": 458.117, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "JunYoung Gwak,", "orig": "JunYoung Gwak,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.181, "r_y0": 679.983, "r_x1": 545.109, "r_y1": 679.983, "r_x2": 545.109, "r_y2": 672.2860000000001, "r_x3": 526.181, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Amir", "orig": "Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 690.942, "r_x1": 482.815, "r_y1": 690.942, "r_x2": 482.815, "r_y2": 683.245, "r_x3": 328.781, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.751, "r_y0": 690.942, "r_x1": 545.113, "r_y1": 690.942, "r_x2": 545.113, "r_y2": 683.245, "r_x3": 488.751, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 701.901, "r_x1": 545.113, "r_y1": 701.901, "r_x2": 545.113, "r_y2": 694.204, "r_x3": 328.781, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 367.74, "r_y1": 712.86, "r_x2": 367.74, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "regression.", "orig": "regression.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.685, "r_y0": 712.86, "r_x1": 379.154, "r_y1": 712.86, "r_x2": 379.154, "r_y2": 705.163, "r_x3": 371.685, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.616, "r_y0": 712.731, "r_x1": 545.109, "r_y1": 712.731, "r_x2": 545.109, "r_y2": 705.001, "r_x3": 381.616, "r_y3": 705.001, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 25, "label": "list_item", "bbox": {"l": 70.031, "t": 76.12599999999998, "r": 212.373, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7310384511947632, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 76.12599999999998, "r": 323.8, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9389600157737732, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 54.595, "t": 120.274, "r": 65.05, "b": 127.971, "coord_origin": "TOPLEFT"}, "confidence": 0.9372755885124207, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 142.36599999999999, "r": 323.8, "b": 150.063, "coord_origin": "TOPLEFT"}, "confidence": 0.9253129959106445, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 54.595, "t": 153.46400000000006, "r": 65.05, "b": 161.16099999999994, "coord_origin": "TOPLEFT"}, "confidence": 0.9378374218940735, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "list_item", "bbox": {"l": 308.862, "t": 175.72900000000004, "r": 323.8, "b": 183.42600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9299732446670532, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "list_item", "bbox": {"l": 54.595, "t": 186.65300000000002, "r": 65.05, "b": 194.35000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9648825526237488, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "list_item", "bbox": {"l": 54.595, "t": 230.80200000000002, "r": 65.05, "b": 238.49900000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9620943069458008, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 308.862, "t": 263.88699999999994, "r": 323.8, "b": 271.58399999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.937321662902832, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 54.595, "t": 274.95000000000005, "r": 65.05, "b": 282.647, "coord_origin": "TOPLEFT"}, "confidence": 0.9555517435073853, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 54.595, "t": 319.099, "r": 65.05, "b": 326.796, "coord_origin": "TOPLEFT"}, "confidence": 0.9479843378067017, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 330.127, "r": 323.8, "b": 337.824, "coord_origin": "TOPLEFT"}, "confidence": 0.9027292728424072, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 54.595, "t": 352.288, "r": 65.05, "b": 359.985, "coord_origin": "TOPLEFT"}, "confidence": 0.9484425187110901, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 374.449, "r": 323.8, "b": 382.146, "coord_origin": "TOPLEFT"}, "confidence": 0.882714569568634, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 54.595, "t": 407.395, "r": 65.05, "b": 415.092, "coord_origin": "TOPLEFT"}, "confidence": 0.9330756664276123, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "list_item", "bbox": {"l": 50.112, "t": 440.585, "r": 65.05, "b": 448.282, "coord_origin": "TOPLEFT"}, "confidence": 0.9274735450744629, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "list_item", "bbox": {"l": 308.862, "t": 440.689, "r": 323.8, "b": 448.386, "coord_origin": "TOPLEFT"}, "confidence": 0.8896440863609314, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 484.733, "r": 65.05, "b": 492.43, "coord_origin": "TOPLEFT"}, "confidence": 0.9299950003623962, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 539.841, "r": 65.05, "b": 547.538, "coord_origin": "TOPLEFT"}, "confidence": 0.9394103288650513, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "list_item", "bbox": {"l": 308.862, "t": 561.7239999999999, "r": 323.8, "b": 569.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9025435447692871, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 594.948, "r": 65.05, "b": 602.645, "coord_origin": "TOPLEFT"}, "confidence": 0.9298838973045349, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "list_item", "bbox": {"l": 308.862, "t": 627.9639999999999, "r": 323.8, "b": 635.6610000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.8777532577514648, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "list_item", "bbox": {"l": 50.112, "t": 650.056, "r": 65.05, "b": 657.7529999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9115257263183594, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "list_item", "bbox": {"l": 308.862, "t": 672.2860000000001, "r": 323.8, "b": 679.983, "coord_origin": "TOPLEFT"}, "confidence": 0.8654531240463257, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "list_item", "bbox": {"l": 50.112, "t": 683.245, "r": 65.05, "b": 690.942, "coord_origin": "TOPLEFT"}, "confidence": 0.912230372428894, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8797808885574341, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "list_item", "id": 25, "page_no": 8, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 70.031, "t": 76.12599999999998, "r": 212.373, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7310384511947632, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "end object detection with transformers."}, {"label": "list_item", "id": 6, "page_no": 8, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 76.12599999999998, "r": 323.8, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9389600157737732, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[16]"}, {"label": "list_item", "id": 9, "page_no": 8, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 54.595, "t": 120.274, "r": 65.05, "b": 127.971, "coord_origin": "TOPLEFT"}, "confidence": 0.9372755885124207, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[2]"}, {"label": "list_item", "id": 15, "page_no": 8, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 142.36599999999999, "r": 323.8, "b": 150.063, "coord_origin": "TOPLEFT"}, "confidence": 0.9253129959106445, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[17]"}, {"label": "list_item", "id": 7, "page_no": 8, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 54.595, "t": 153.46400000000006, "r": 65.05, "b": 161.16099999999994, "coord_origin": "TOPLEFT"}, "confidence": 0.9378374218940735, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[3]"}, {"label": "list_item", "id": 12, "page_no": 8, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 308.862, "t": 175.72900000000004, "r": 323.8, "b": 183.42600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9299732446670532, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[18]"}, {"label": "list_item", "id": 0, "page_no": 8, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 54.595, "t": 186.65300000000002, "r": 65.05, "b": 194.35000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9648825526237488, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[4]"}, {"label": "list_item", "id": 1, "page_no": 8, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 54.595, "t": 230.80200000000002, "r": 65.05, "b": 238.49900000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9620943069458008, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[5]"}, {"label": "list_item", "id": 8, "page_no": 8, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 308.862, "t": 263.88699999999994, "r": 323.8, "b": 271.58399999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.937321662902832, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[19]"}, {"label": "list_item", "id": 2, "page_no": 8, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 54.595, "t": 274.95000000000005, "r": 65.05, "b": 282.647, "coord_origin": "TOPLEFT"}, "confidence": 0.9555517435073853, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[6]"}, {"label": "list_item", "id": 4, "page_no": 8, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 54.595, "t": 319.099, "r": 65.05, "b": 326.796, "coord_origin": "TOPLEFT"}, "confidence": 0.9479843378067017, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[7]"}, {"label": "list_item", "id": 18, "page_no": 8, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 330.127, "r": 323.8, "b": 337.824, "coord_origin": "TOPLEFT"}, "confidence": 0.9027292728424072, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[20]"}, {"label": "list_item", "id": 3, "page_no": 8, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 54.595, "t": 352.288, "r": 65.05, "b": 359.985, "coord_origin": "TOPLEFT"}, "confidence": 0.9484425187110901, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[8]"}, {"label": "list_item", "id": 21, "page_no": 8, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 374.449, "r": 323.8, "b": 382.146, "coord_origin": "TOPLEFT"}, "confidence": 0.882714569568634, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[21]"}, {"label": "list_item", "id": 10, "page_no": 8, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 54.595, "t": 407.395, "r": 65.05, "b": 415.092, "coord_origin": "TOPLEFT"}, "confidence": 0.9330756664276123, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[9]"}, {"label": "list_item", "id": 14, "page_no": 8, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 50.112, "t": 440.585, "r": 65.05, "b": 448.282, "coord_origin": "TOPLEFT"}, "confidence": 0.9274735450744629, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[10]"}, {"label": "list_item", "id": 20, "page_no": 8, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 308.862, "t": 440.689, "r": 323.8, "b": 448.386, "coord_origin": "TOPLEFT"}, "confidence": 0.8896440863609314, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[22]"}, {"label": "list_item", "id": 11, "page_no": 8, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 484.733, "r": 65.05, "b": 492.43, "coord_origin": "TOPLEFT"}, "confidence": 0.9299950003623962, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[11]"}, {"label": "list_item", "id": 5, "page_no": 8, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 539.841, "r": 65.05, "b": 547.538, "coord_origin": "TOPLEFT"}, "confidence": 0.9394103288650513, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[12]"}, {"label": "list_item", "id": 19, "page_no": 8, "cluster": {"id": 19, "label": "list_item", "bbox": {"l": 308.862, "t": 561.7239999999999, "r": 323.8, "b": 569.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9025435447692871, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[23]"}, {"label": "list_item", "id": 13, "page_no": 8, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 594.948, "r": 65.05, "b": 602.645, "coord_origin": "TOPLEFT"}, "confidence": 0.9298838973045349, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[13]"}, {"label": "list_item", "id": 23, "page_no": 8, "cluster": {"id": 23, "label": "list_item", "bbox": {"l": 308.862, "t": 627.9639999999999, "r": 323.8, "b": 635.6610000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.8777532577514648, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[24]"}, {"label": "list_item", "id": 17, "page_no": 8, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 50.112, "t": 650.056, "r": 65.05, "b": 657.7529999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9115257263183594, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[14]"}, {"label": "list_item", "id": 24, "page_no": 8, "cluster": {"id": 24, "label": "list_item", "bbox": {"l": 308.862, "t": 672.2860000000001, "r": 323.8, "b": 679.983, "coord_origin": "TOPLEFT"}, "confidence": 0.8654531240463257, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[25]"}, {"label": "list_item", "id": 16, "page_no": 8, "cluster": {"id": 16, "label": "list_item", "bbox": {"l": 50.112, "t": 683.245, "r": 65.05, "b": 690.942, "coord_origin": "TOPLEFT"}, "confidence": 0.912230372428894, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[15]"}, {"label": "page_footer", "id": 22, "page_no": 8, "cluster": {"id": 22, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8797808885574341, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}], "body": [{"label": "list_item", "id": 25, "page_no": 8, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 70.031, "t": 76.12599999999998, "r": 212.373, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7310384511947632, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "end object detection with transformers."}, {"label": "list_item", "id": 6, "page_no": 8, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 76.12599999999998, "r": 323.8, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9389600157737732, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[16]"}, {"label": "list_item", "id": 9, "page_no": 8, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 54.595, "t": 120.274, "r": 65.05, "b": 127.971, "coord_origin": "TOPLEFT"}, "confidence": 0.9372755885124207, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[2]"}, {"label": "list_item", "id": 15, "page_no": 8, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 142.36599999999999, "r": 323.8, "b": 150.063, "coord_origin": "TOPLEFT"}, "confidence": 0.9253129959106445, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[17]"}, {"label": "list_item", "id": 7, "page_no": 8, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 54.595, "t": 153.46400000000006, "r": 65.05, "b": 161.16099999999994, "coord_origin": "TOPLEFT"}, "confidence": 0.9378374218940735, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[3]"}, {"label": "list_item", "id": 12, "page_no": 8, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 308.862, "t": 175.72900000000004, "r": 323.8, "b": 183.42600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9299732446670532, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[18]"}, {"label": "list_item", "id": 0, "page_no": 8, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 54.595, "t": 186.65300000000002, "r": 65.05, "b": 194.35000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9648825526237488, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[4]"}, {"label": "list_item", "id": 1, "page_no": 8, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 54.595, "t": 230.80200000000002, "r": 65.05, "b": 238.49900000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9620943069458008, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[5]"}, {"label": "list_item", "id": 8, "page_no": 8, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 308.862, "t": 263.88699999999994, "r": 323.8, "b": 271.58399999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.937321662902832, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[19]"}, {"label": "list_item", "id": 2, "page_no": 8, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 54.595, "t": 274.95000000000005, "r": 65.05, "b": 282.647, "coord_origin": "TOPLEFT"}, "confidence": 0.9555517435073853, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[6]"}, {"label": "list_item", "id": 4, "page_no": 8, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 54.595, "t": 319.099, "r": 65.05, "b": 326.796, "coord_origin": "TOPLEFT"}, "confidence": 0.9479843378067017, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[7]"}, {"label": "list_item", "id": 18, "page_no": 8, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 330.127, "r": 323.8, "b": 337.824, "coord_origin": "TOPLEFT"}, "confidence": 0.9027292728424072, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[20]"}, {"label": "list_item", "id": 3, "page_no": 8, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 54.595, "t": 352.288, "r": 65.05, "b": 359.985, "coord_origin": "TOPLEFT"}, "confidence": 0.9484425187110901, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[8]"}, {"label": "list_item", "id": 21, "page_no": 8, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 374.449, "r": 323.8, "b": 382.146, "coord_origin": "TOPLEFT"}, "confidence": 0.882714569568634, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[21]"}, {"label": "list_item", "id": 10, "page_no": 8, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 54.595, "t": 407.395, "r": 65.05, "b": 415.092, "coord_origin": "TOPLEFT"}, "confidence": 0.9330756664276123, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[9]"}, {"label": "list_item", "id": 14, "page_no": 8, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 50.112, "t": 440.585, "r": 65.05, "b": 448.282, "coord_origin": "TOPLEFT"}, "confidence": 0.9274735450744629, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[10]"}, {"label": "list_item", "id": 20, "page_no": 8, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 308.862, "t": 440.689, "r": 323.8, "b": 448.386, "coord_origin": "TOPLEFT"}, "confidence": 0.8896440863609314, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[22]"}, {"label": "list_item", "id": 11, "page_no": 8, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 484.733, "r": 65.05, "b": 492.43, "coord_origin": "TOPLEFT"}, "confidence": 0.9299950003623962, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[11]"}, {"label": "list_item", "id": 5, "page_no": 8, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 539.841, "r": 65.05, "b": 547.538, "coord_origin": "TOPLEFT"}, "confidence": 0.9394103288650513, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[12]"}, {"label": "list_item", "id": 19, "page_no": 8, "cluster": {"id": 19, "label": "list_item", "bbox": {"l": 308.862, "t": 561.7239999999999, "r": 323.8, "b": 569.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9025435447692871, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[23]"}, {"label": "list_item", "id": 13, "page_no": 8, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 594.948, "r": 65.05, "b": 602.645, "coord_origin": "TOPLEFT"}, "confidence": 0.9298838973045349, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[13]"}, {"label": "list_item", "id": 23, "page_no": 8, "cluster": {"id": 23, "label": "list_item", "bbox": {"l": 308.862, "t": 627.9639999999999, "r": 323.8, "b": 635.6610000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.8777532577514648, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[24]"}, {"label": "list_item", "id": 17, "page_no": 8, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 50.112, "t": 650.056, "r": 65.05, "b": 657.7529999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9115257263183594, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[14]"}, {"label": "list_item", "id": 24, "page_no": 8, "cluster": {"id": 24, "label": "list_item", "bbox": {"l": 308.862, "t": 672.2860000000001, "r": 323.8, "b": 679.983, "coord_origin": "TOPLEFT"}, "confidence": 0.8654531240463257, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[25]"}, {"label": "list_item", "id": 16, "page_no": 8, "cluster": {"id": 16, "label": "list_item", "bbox": {"l": 50.112, "t": 683.245, "r": 65.05, "b": 690.942, "coord_origin": "TOPLEFT"}, "confidence": 0.912230372428894, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[15]"}], "headers": [{"label": "page_footer", "id": 22, "page_no": 8, "cluster": {"id": 22, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8797808885574341, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}]}}, {"page_no": 9, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.579, "r_y0": 83.82299999999998, "r_x1": 225.821, "r_y1": 83.82299999999998, "r_x2": 225.821, "r_y2": 76.12599999999998, "r_x3": 223.579, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.183, "r_y0": 83.82299999999998, "r_x1": 286.362, "r_y1": 83.82299999999998, "r_x2": 286.362, "r_y2": 76.12599999999998, "r_x3": 229.183, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "pages 658-666,", "orig": "pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 97.917, "r_y1": 94.78200000000004, "r_x2": 97.917, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 106.10500000000002, "r_x1": 286.359, "r_y1": 106.10500000000002, "r_x2": 286.359, "r_y2": 98.40800000000002, "r_x3": 70.035, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 117.06399999999996, "r_x1": 286.363, "r_y1": 117.06399999999996, "r_x2": 286.363, "r_y2": 109.36699999999996, "r_x3": 70.031, "r_y3": 109.36699999999996, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 128.02300000000002, "r_x1": 286.363, "r_y1": 128.02300000000002, "r_x2": 286.363, "r_y2": 120.32600000000002, "r_x3": 70.031, "r_y3": 120.32600000000002, "coord_origin": "TOPLEFT"}, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.98199999999997, "r_x1": 77.5, "r_y1": 138.98199999999997, "r_x2": 77.5, "r_y2": 131.28499999999997, "r_x3": 70.031, "r_y3": 131.28499999999997, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.56, "r_y0": 138.85299999999995, "r_x1": 286.366, "r_y1": 138.85299999999995, "r_x2": 286.366, "r_y2": 131.12300000000005, "r_x3": 80.56, "r_y3": 131.12300000000005, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.812, "r_x1": 195.229, "r_y1": 149.812, "r_x2": 195.229, "r_y2": 142.082, "r_x3": 70.031, "r_y3": 142.082, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.231, "r_y0": 149.94100000000003, "r_x1": 286.365, "r_y1": 149.94100000000003, "r_x2": 286.365, "r_y2": 142.24400000000003, "r_x3": 195.231, "r_y3": 142.24400000000003, "coord_origin": "TOPLEFT"}, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 160.89999999999998, "r_x1": 120.333, "r_y1": 160.89999999999998, "r_x2": 120.333, "r_y2": 153.20299999999997, "r_x3": 70.031, "r_y3": 153.20299999999997, "coord_origin": "TOPLEFT"}, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 172.22400000000005, "r_x1": 286.359, "r_y1": 172.22400000000005, "r_x2": 286.359, "r_y2": 164.52700000000004, "r_x3": 70.035, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.183, "r_x1": 158.395, "r_y1": 183.183, "r_x2": 158.395, "r_y2": 175.486, "r_x3": 70.031, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed.", "orig": "gel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.035, "r_y0": 183.183, "r_x1": 202.877, "r_y1": 183.183, "r_x2": 202.877, "r_y2": 175.486, "r_x3": 164.035, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deepdesrt:", "orig": "Deepdesrt:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.163, "r_y0": 183.183, "r_x1": 286.363, "r_y1": 183.183, "r_x2": 286.363, "r_y2": 175.486, "r_x3": 207.163, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deep learning for de-", "orig": "Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 194.14200000000005, "r_x1": 286.363, "r_y1": 194.14200000000005, "r_x2": 286.363, "r_y2": 186.44500000000005, "r_x3": 70.031, "r_y3": 186.44500000000005, "coord_origin": "TOPLEFT"}, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.101, "r_x1": 88.206, "r_y1": 205.101, "r_x2": 88.206, "r_y2": 197.404, "r_x3": 70.031, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "ages.", "orig": "ages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.864, "r_y0": 205.101, "r_x1": 101.333, "r_y1": 205.101, "r_x2": 101.333, "r_y2": 197.404, "r_x3": 93.864, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.331, "r_y0": 204.97199999999998, "r_x1": 286.358, "r_y1": 204.97199999999998, "r_x2": 286.358, "r_y2": 197.24199999999996, "r_x3": 104.331, "r_y3": 197.24199999999996, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 215.92999999999995, "r_x1": 220.487, "r_y1": 215.92999999999995, "r_x2": 220.487, "r_y2": 208.20000000000005, "r_x3": 70.031, "r_y3": 208.20000000000005, "coord_origin": "TOPLEFT"}, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.484, "r_y0": 216.05899999999997, "r_x1": 222.726, "r_y1": 216.05899999999997, "r_x2": 222.726, "r_y2": 208.36199999999997, "r_x3": 220.484, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 225.909, "r_y0": 216.05899999999997, "r_x1": 286.36, "r_y1": 216.05899999999997, "r_x2": 286.36, "r_y2": 208.36199999999997, "r_x3": 225.909, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": "volume 1, pages", "orig": "volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.01800000000003, "r_x1": 166.653, "r_y1": 227.01800000000003, "r_x2": 166.653, "r_y2": 219.32100000000003, "r_x3": 70.031, "r_y3": 219.32100000000003, "coord_origin": "TOPLEFT"}, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.34199999999998, "r_x1": 179.147, "r_y1": 238.34199999999998, "r_x2": 179.147, "r_y2": 230.64499999999998, "r_x3": 70.035, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Faisal Shafait and Ray Smith.", "orig": "Faisal Shafait and Ray Smith.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.366, "r_y0": 238.34199999999998, "r_x1": 286.359, "r_y1": 238.34199999999998, "r_x2": 286.359, "r_y2": 230.64499999999998, "r_x3": 184.366, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Table detection in heteroge-", "orig": "Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.30100000000004, "r_x1": 134.804, "r_y1": 249.30100000000004, "r_x2": 134.804, "r_y2": 241.60400000000004, "r_x3": 70.031, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "neous documents.", "orig": "neous documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.7, "r_y0": 249.30100000000004, "r_x1": 147.169, "r_y1": 249.30100000000004, "r_x2": 147.169, "r_y2": 241.60400000000004, "r_x3": 139.7, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.933, "r_y0": 249.17200000000003, "r_x1": 286.366, "r_y1": 249.17200000000003, "r_x2": 286.366, "r_y2": 241.442, "r_x3": 149.933, "r_y3": 241.442, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.131, "r_x1": 244.688, "r_y1": 260.131, "r_x2": 244.688, "r_y2": 252.40099999999995, "r_x3": 70.031, "r_y3": 252.40099999999995, "coord_origin": "TOPLEFT"}, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.691, "r_y0": 260.26, "r_x1": 246.933, "r_y1": 260.26, "r_x2": 246.933, "r_y2": 252.563, "r_x3": 244.691, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.775, "r_y0": 260.26, "r_x1": 286.358, "r_y1": 260.26, "r_x2": 286.358, "r_y2": 252.563, "r_x3": 249.775, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": "pages 65-", "orig": "pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.21900000000005, "r_x1": 111.366, "r_y1": 271.21900000000005, "r_x2": 111.366, "r_y2": 263.52200000000005, "r_x3": 70.031, "r_y3": 263.52200000000005, "coord_origin": "TOPLEFT"}, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.543, "r_x1": 94.944, "r_y1": 282.543, "r_x2": 94.944, "r_y2": 274.846, "r_x3": 70.035, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.871, "r_y0": 282.543, "r_x1": 127.268, "r_y1": 282.543, "r_x2": 127.268, "r_y2": 274.846, "r_x3": 100.871, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.195, "r_y0": 282.543, "r_x1": 165.832, "r_y1": 282.543, "r_x2": 165.832, "r_y2": 274.846, "r_x3": 133.195, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.683, "r_y0": 282.543, "r_x1": 194.094, "r_y1": 282.543, "r_x2": 194.094, "r_y2": 274.846, "r_x3": 172.683, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.021, "r_y0": 282.543, "r_x1": 211.48, "r_y1": 282.543, "r_x2": 211.48, "r_y2": 274.846, "r_x3": 200.021, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.407, "r_y0": 282.543, "r_x1": 239.438, "r_y1": 282.543, "r_x2": 239.438, "r_y2": 274.846, "r_x3": 217.407, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.288, "r_y0": 282.543, "r_x1": 264.221, "r_y1": 282.543, "r_x2": 264.221, "r_y2": 274.846, "r_x3": 246.288, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.147, "r_y0": 282.543, "r_x1": 286.359, "r_y1": 282.543, "r_x2": 286.359, "r_y2": 274.846, "r_x3": 270.147, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.502, "r_x1": 85.964, "r_y1": 293.502, "r_x2": 85.964, "r_y2": 285.805, "r_x3": 70.031, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "seen", "orig": "seen", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.021, "r_y0": 293.502, "r_x1": 108.945, "r_y1": 293.502, "r_x2": 108.945, "r_y2": 285.805, "r_x3": 91.021, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Raza", "orig": "Raza", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.002, "r_y0": 293.502, "r_x1": 135.674, "r_y1": 293.502, "r_x2": 135.674, "r_y2": 285.805, "r_x3": 114.002, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Rizvi,", "orig": "Rizvi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.43, "r_y0": 293.502, "r_x1": 171.306, "r_y1": 293.502, "r_x2": 171.306, "r_y2": 285.805, "r_x3": 141.43, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Andreas", "orig": "Andreas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.364, "r_y0": 293.502, "r_x1": 204.5, "r_y1": 293.502, "r_x2": 204.5, "r_y2": 285.805, "r_x3": 176.364, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dengel,", "orig": "Dengel,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.265, "r_y0": 293.502, "r_x1": 223.213, "r_y1": 293.502, "r_x2": 223.213, "r_y2": 285.805, "r_x3": 210.265, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.27, "r_y0": 293.502, "r_x1": 252.668, "r_y1": 293.502, "r_x2": 252.668, "r_y2": 285.805, "r_x3": 228.27, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Sheraz", "orig": "Sheraz", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.725, "r_y0": 293.502, "r_x1": 286.363, "r_y1": 293.502, "r_x2": 286.363, "r_y2": 285.805, "r_x3": 257.725, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ahmed.", "orig": "Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.461, "r_x1": 286.363, "r_y1": 304.461, "r_x2": 286.363, "r_y2": 296.764, "r_x3": 70.031, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.42, "r_x1": 77.5, "r_y1": 315.42, "r_x2": 77.5, "r_y2": 307.723, "r_x3": 70.031, "r_y3": 307.723, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.35, "r_y0": 315.291, "r_x1": 286.366, "r_y1": 315.291, "r_x2": 286.366, "r_y2": 307.561, "r_x3": 79.35, "r_y3": 307.561, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 326.249, "r_x1": 147.572, "r_y1": 326.249, "r_x2": 147.572, "r_y2": 318.519, "r_x3": 70.031, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.572, "r_y0": 326.378, "r_x1": 271.335, "r_y1": 326.378, "r_x2": 271.335, "r_y2": 318.681, "r_x3": 147.572, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 337.702, "r_x1": 286.359, "r_y1": 337.702, "r_x2": 286.359, "r_y2": 330.005, "r_x3": 70.035, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.661, "r_x1": 286.363, "r_y1": 348.661, "r_x2": 286.363, "r_y2": 340.964, "r_x3": 70.031, "r_y3": 340.964, "coord_origin": "TOPLEFT"}, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 359.62, "r_x1": 198.824, "r_y1": 359.62, "r_x2": 198.824, "r_y2": 351.923, "r_x3": 70.031, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.06, "r_y0": 359.62, "r_x1": 213.529, "r_y1": 359.62, "r_x2": 213.529, "r_y2": 351.923, "r_x3": 206.06, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.021, "r_y0": 359.491, "r_x1": 286.358, "r_y1": 359.491, "r_x2": 286.358, "r_y2": 351.761, "r_x3": 217.021, "r_y3": 351.761, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.031, "r_y3": 362.72, "coord_origin": "TOPLEFT"}, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.078, "r_y0": 370.579, "r_x1": 145.32, "r_y1": 370.579, "r_x2": 145.32, "r_y2": 362.882, "r_x3": 143.078, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.108, "r_y0": 370.579, "r_x1": 286.361, "r_y1": 370.579, "r_x2": 286.361, "r_y2": 362.882, "r_x3": 148.108, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": "KDD '18, pages 774-782, New York,", "orig": "KDD '18, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.538, "r_x1": 161.157, "r_y1": 381.538, "r_x2": 161.157, "r_y2": 373.841, "r_x3": 70.031, "r_y3": 373.841, "coord_origin": "TOPLEFT"}, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 392.862, "r_x1": 286.359, "r_y1": 392.862, "r_x2": 286.359, "r_y2": 385.165, "r_x3": 70.035, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 84.225, "r_y1": 403.821, "r_x2": 84.225, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "reit,", "orig": "reit,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.489, "r_y0": 403.821, "r_x1": 286.363, "r_y1": 403.821, "r_x2": 286.363, "r_y2": 396.124, "r_x3": 87.489, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 414.78, "r_x1": 78.997, "r_y1": 414.78, "r_x2": 78.997, "r_y2": 407.083, "r_x3": 70.031, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "lia", "orig": "lia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.871, "r_y0": 414.78, "r_x1": 125.47, "r_y1": 414.78, "r_x2": 125.47, "r_y2": 407.083, "r_x3": 82.871, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Polosukhin.", "orig": "Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.908, "r_y0": 414.78, "r_x1": 167.783, "r_y1": 414.78, "r_x2": 167.783, "r_y2": 407.083, "r_x3": 133.908, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.656, "r_y0": 414.78, "r_x1": 177.637, "r_y1": 414.78, "r_x2": 177.637, "r_y2": 407.083, "r_x3": 171.656, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.51, "r_y0": 414.78, "r_x1": 190.477, "r_y1": 414.78, "r_x2": 190.477, "r_y2": 407.083, "r_x3": 181.51, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.341, "r_y0": 414.78, "r_x1": 230.834, "r_y1": 414.78, "r_x2": 230.834, "r_y2": 407.083, "r_x3": 194.341, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "you need.", "orig": "you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.272, "r_y0": 414.78, "r_x1": 246.741, "r_y1": 414.78, "r_x2": 246.741, "r_y2": 407.083, "r_x3": 239.272, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.614, "r_y0": 414.78, "r_x1": 255.842, "r_y1": 414.78, "r_x2": 255.842, "r_y2": 407.083, "r_x3": 250.614, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "I.", "orig": "I.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.715, "r_y0": 414.78, "r_x1": 286.363, "r_y1": 414.78, "r_x2": 286.363, "r_y2": 407.083, "r_x3": 259.715, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Guyon,", "orig": "Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 425.739, "r_x1": 286.363, "r_y1": 425.739, "r_x2": 286.363, "r_y2": 418.042, "r_x3": 70.031, "r_y3": 418.042, "coord_origin": "TOPLEFT"}, "text": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.697, "r_x1": 196.762, "r_y1": 436.697, "r_x2": 196.762, "r_y2": 429.0, "r_x3": 70.031, "r_y3": 429.0, "coord_origin": "TOPLEFT"}, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.202, "r_y0": 436.568, "r_x1": 286.36, "r_y1": 436.568, "r_x2": 286.36, "r_y2": 428.838, "r_x3": 200.202, "r_y3": 428.838, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 447.527, "r_x1": 189.194, "r_y1": 447.527, "r_x2": 189.194, "r_y2": 439.797, "r_x3": 70.031, "r_y3": 439.797, "coord_origin": "TOPLEFT"}, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.195, "r_y0": 447.656, "r_x1": 191.437, "r_y1": 447.656, "r_x2": 191.437, "r_y2": 439.959, "r_x3": 189.195, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.795, "r_y0": 447.656, "r_x1": 286.364, "r_y1": 447.656, "r_x2": 286.364, "r_y2": 439.959, "r_x3": 193.795, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": "pages 5998-6008. Curran", "orig": "pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 458.615, "r_x1": 158.924, "r_y1": 458.615, "r_x2": 158.924, "r_y2": 450.918, "r_x3": 70.031, "r_y3": 450.918, "coord_origin": "TOPLEFT"}, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 469.939, "r_x1": 88.963, "r_y1": 469.939, "r_x2": 88.963, "r_y2": 462.242, "r_x3": 70.035, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Oriol", "orig": "Oriol", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.81, "r_y0": 469.939, "r_x1": 122.274, "r_y1": 469.939, "r_x2": 122.274, "r_y2": 462.242, "r_x3": 92.81, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Vinyals,", "orig": "Vinyals,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.524, "r_y0": 469.939, "r_x1": 194.695, "r_y1": 469.939, "r_x2": 194.695, "r_y2": 462.242, "r_x3": 126.524, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Alexander Toshev,", "orig": "Alexander Toshev,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.954, "r_y0": 469.939, "r_x1": 286.359, "r_y1": 469.939, "r_x2": 286.359, "r_y2": 462.242, "r_x3": 198.954, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Samy Bengio, and Du-", "orig": "Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 480.898, "r_x1": 116.28, "r_y1": 480.898, "r_x2": 116.28, "r_y2": 473.201, "r_x3": 70.031, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.484, "r_y0": 480.898, "r_x1": 175.924, "r_y1": 480.898, "r_x2": 175.924, "r_y2": 473.201, "r_x3": 122.484, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "Show and tell:", "orig": "Show and tell:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.56, "r_y0": 480.898, "r_x1": 286.363, "r_y1": 480.898, "r_x2": 286.363, "r_y2": 473.201, "r_x3": 180.56, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "A neural image caption gen-", "orig": "A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 491.857, "r_x1": 103.305, "r_y1": 491.857, "r_x2": 103.305, "r_y2": 484.16, "r_x3": 70.031, "r_y3": 484.16, "coord_origin": "TOPLEFT"}, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.516, "r_y0": 491.728, "r_x1": 286.359, "r_y1": 491.728, "r_x2": 286.359, "r_y2": 483.998, "r_x3": 105.516, "r_y3": 483.998, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 502.687, "r_x1": 212.516, "r_y1": 502.687, "r_x2": 212.516, "r_y2": 494.957, "r_x3": 70.031, "r_y3": 494.957, "coord_origin": "TOPLEFT"}, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.514, "r_y0": 502.816, "r_x1": 263.56, "r_y1": 502.816, "r_x2": 263.56, "r_y2": 495.119, "r_x3": 212.514, "r_y3": 495.119, "coord_origin": "TOPLEFT"}, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 514.14, "r_x1": 247.373, "r_y1": 514.14, "r_x2": 247.373, "r_y2": 506.443, "r_x3": 70.035, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.972, "r_y0": 514.14, "r_x1": 286.359, "r_y1": 514.14, "r_x2": 286.359, "r_y2": 506.443, "r_x3": 253.972, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.0989999999999, "r_x1": 253.125, "r_y1": 525.0989999999999, "r_x2": 253.125, "r_y2": 517.402, "r_x3": 70.031, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "reconstruct syntactic structures from table images.", "orig": "reconstruct syntactic structures from table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.155, "r_y0": 525.0989999999999, "r_x1": 265.624, "r_y1": 525.0989999999999, "r_x2": 265.624, "r_y2": 517.402, "r_x3": 258.155, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.429, "r_y0": 524.97, "r_x1": 286.362, "r_y1": 524.97, "r_x2": 286.362, "r_y2": 517.24, "r_x3": 268.429, "r_y3": 517.24, "coord_origin": "TOPLEFT"}, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 535.929, "r_x1": 286.363, "r_y1": 535.929, "r_x2": 286.363, "r_y2": 528.1990000000001, "r_x3": 70.031, "r_y3": 528.1990000000001, "coord_origin": "TOPLEFT"}, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 546.887, "r_x1": 125.255, "r_y1": 546.887, "r_x2": 125.255, "r_y2": 539.157, "r_x3": 70.031, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.254, "r_y0": 547.016, "r_x1": 240.051, "r_y1": 547.016, "r_x2": 240.051, "r_y2": 539.319, "r_x3": 125.254, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 558.34, "r_x1": 125.008, "r_y1": 558.34, "r_x2": 125.008, "r_y2": 550.643, "r_x3": 70.035, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue,", "orig": "Wenyuan Xue,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.823, "r_y0": 558.34, "r_x1": 181.676, "r_y1": 558.34, "r_x2": 181.676, "r_y2": 550.643, "r_x3": 129.823, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Baosheng Yu,", "orig": "Baosheng Yu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.491, "r_y0": 558.34, "r_x1": 286.359, "r_y1": 558.34, "r_x2": 286.359, "r_y2": 550.643, "r_x3": 186.491, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wen Wang, Dacheng Tao,", "orig": "Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.299, "r_x1": 137.082, "r_y1": 569.299, "r_x2": 137.082, "r_y2": 561.602, "r_x3": 70.031, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.985, "r_y0": 569.299, "r_x1": 172.382, "r_y1": 569.299, "r_x2": 172.382, "r_y2": 561.602, "r_x3": 145.985, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.704, "r_y0": 569.299, "r_x1": 206.625, "r_y1": 569.299, "r_x2": 206.625, "r_y2": 561.602, "r_x3": 178.704, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "A table", "orig": "A table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 569.299, "r_x1": 286.363, "r_y1": 569.299, "r_x2": 286.363, "r_y2": 561.602, "r_x3": 210.633, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "graph reconstruction", "orig": "graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.258, "r_x1": 99.324, "r_y1": 580.258, "r_x2": 99.324, "r_y2": 572.561, "r_x3": 70.031, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.157, "r_y0": 580.258, "r_x1": 114.612, "r_y1": 580.258, "r_x2": 114.612, "r_y2": 572.561, "r_x3": 104.157, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.454, "r_y0": 580.258, "r_x1": 136.884, "r_y1": 580.258, "r_x2": 136.884, "r_y2": 572.561, "r_x3": 119.454, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.717, "r_y0": 580.258, "r_x1": 173.091, "r_y1": 580.258, "r_x2": 173.091, "r_y2": 572.561, "r_x3": 141.717, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.933, "r_y0": 580.258, "r_x1": 221.007, "r_y1": 580.258, "r_x2": 221.007, "r_y2": 572.561, "r_x3": 177.933, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.543, "r_y0": 580.129, "r_x1": 252.466, "r_y1": 580.129, "r_x2": 252.466, "r_y2": 572.399, "r_x3": 232.543, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "arXiv", "orig": "arXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.299, "r_y0": 580.129, "r_x1": 286.359, "r_y1": 580.129, "r_x2": 286.359, "r_y2": 572.399, "r_x3": 257.299, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "preprint", "orig": "preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.088, "r_x1": 135.531, "r_y1": 591.088, "r_x2": 135.531, "r_y2": 583.358, "r_x3": 70.031, "r_y3": 583.358, "coord_origin": "TOPLEFT"}, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.53, "r_y0": 591.217, "r_x1": 167.899, "r_y1": 591.217, "r_x2": 167.899, "r_y2": 583.52, "r_x3": 135.53, "r_y3": 583.52, "coord_origin": "TOPLEFT"}, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.5409999999999, "r_x1": 286.359, "r_y1": 602.5409999999999, "r_x2": 286.359, "r_y2": 594.844, "r_x3": 70.035, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.5, "r_x1": 109.107, "r_y1": 613.5, "r_x2": 109.107, "r_y2": 605.803, "r_x3": 70.031, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.226, "r_y0": 613.5, "r_x1": 271.766, "r_y1": 613.5, "r_x2": 271.766, "r_y2": 605.803, "r_x3": 116.226, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 613.5, "r_x1": 286.363, "r_y1": 613.5, "r_x2": 286.363, "r_y2": 605.803, "r_x3": 278.894, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.33, "r_x1": 286.363, "r_y1": 624.33, "r_x2": 286.363, "r_y2": 616.6, "r_x3": 70.031, "r_y3": 616.6, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.289, "r_x1": 139.099, "r_y1": 635.289, "r_x2": 139.099, "r_y2": 627.559, "r_x3": 70.031, "r_y3": 627.559, "coord_origin": "TOPLEFT"}, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.098, "r_y0": 635.418, "r_x1": 238.957, "r_y1": 635.418, "r_x2": 238.957, "r_y2": 627.721, "r_x3": 139.098, "r_y3": 627.721, "coord_origin": "TOPLEFT"}, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 646.742, "r_x1": 286.359, "r_y1": 646.742, "r_x2": 286.359, "r_y2": 639.045, "r_x3": 70.035, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 657.7, "r_x1": 286.363, "r_y1": 657.7, "r_x2": 286.363, "r_y2": 650.0029999999999, "r_x3": 70.031, "r_y3": 650.0029999999999, "coord_origin": "TOPLEFT"}, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.659, "r_x1": 286.363, "r_y1": 668.659, "r_x2": 286.363, "r_y2": 660.962, "r_x3": 70.031, "r_y3": 660.962, "coord_origin": "TOPLEFT"}, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.6179999999999, "r_x1": 158.458, "r_y1": 679.6179999999999, "r_x2": 158.458, "r_y2": 671.921, "r_x3": 70.031, "r_y3": 671.921, "coord_origin": "TOPLEFT"}, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.528, "r_y0": 679.489, "r_x1": 286.362, "r_y1": 679.489, "r_x2": 286.362, "r_y2": 671.759, "r_x3": 160.528, "r_y3": 671.759, "coord_origin": "TOPLEFT"}, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 690.448, "r_x1": 171.423, "r_y1": 690.448, "r_x2": 171.423, "r_y2": 682.718, "r_x3": 70.031, "r_y3": 682.718, "coord_origin": "TOPLEFT"}, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.422, "r_y0": 690.577, "r_x1": 212.757, "r_y1": 690.577, "r_x2": 212.757, "r_y2": 682.88, "r_x3": 171.422, "r_y3": 682.88, "coord_origin": "TOPLEFT"}, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 701.901, "r_x1": 80.992, "r_y1": 701.901, "r_x2": 80.992, "r_y2": 694.204, "r_x3": 70.035, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.062, "r_y0": 701.901, "r_x1": 114.715, "r_y1": 701.901, "r_x2": 114.715, "r_y2": 694.204, "r_x3": 89.062, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.246, "r_y0": 701.901, "r_x1": 149.146, "r_y1": 701.901, "r_x2": 149.146, "r_y2": 694.204, "r_x3": 124.246, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.225, "r_y0": 701.901, "r_x1": 209.373, "r_y1": 701.901, "r_x2": 209.373, "r_y2": 694.204, "r_x3": 157.225, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.904, "r_y0": 701.901, "r_x1": 231.852, "r_y1": 701.901, "r_x2": 231.852, "r_y2": 694.204, "r_x3": 218.904, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.931, "r_y0": 701.901, "r_x1": 269.323, "r_y1": 701.901, "r_x2": 269.323, "r_y2": 694.204, "r_x3": 239.931, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 277.392, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 277.392, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 116.719, "r_y1": 712.86, "r_x2": 116.719, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "meno Yepes.", "orig": "meno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.413, "r_y0": 712.86, "r_x1": 235.013, "r_y1": 712.86, "r_x2": 235.013, "r_y2": 705.163, "r_x3": 122.413, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Image-based table recognition:", "orig": "Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.335, "r_y0": 712.86, "r_x1": 286.363, "r_y1": 712.86, "r_x2": 286.363, "r_y2": 705.163, "r_x3": 239.335, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Data, model,", "orig": "Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.56, "r_y0": 83.82299999999998, "r_x1": 545.113, "r_y1": 83.82299999999998, "r_x2": 545.113, "r_y2": 76.12599999999998, "r_x3": 388.56, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 472.306, "r_y1": 94.78099999999995, "r_x2": 472.306, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.885, "r_y0": 94.65200000000004, "r_x1": 545.115, "r_y1": 94.65200000000004, "r_x2": 545.115, "r_y2": 86.92200000000003, "r_x3": 475.885, "r_y3": 86.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.61099999999999, "r_x1": 371.927, "r_y1": 105.61099999999999, "r_x2": 371.927, "r_y2": 97.88099999999997, "r_x3": 328.781, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.926, "r_y0": 105.74000000000001, "r_x1": 374.168, "r_y1": 105.74000000000001, "r_x2": 374.168, "r_y2": 98.043, "r_x3": 371.926, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.472, "r_y0": 105.74000000000001, "r_x1": 545.112, "r_y1": 105.74000000000001, "r_x2": 545.112, "r_y2": 98.043, "r_x3": 376.472, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "pages 564-580, Cham, 2020. Springer Interna-", "orig": "pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 417.701, "r_y1": 116.69899999999996, "r_x2": 417.701, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 128.654, "r_x1": 523.15, "r_y1": 128.654, "r_x2": 523.15, "r_y2": 120.957, "r_x3": 328.785, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.171, "r_y0": 128.654, "r_x1": 545.109, "r_y1": 128.654, "r_x2": 545.109, "r_y2": 120.957, "r_x3": 528.171, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Pub-", "orig": "Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 139.61300000000006, "r_x1": 545.113, "r_y1": 139.61300000000006, "r_x2": 545.113, "r_y2": 131.91600000000005, "r_x3": 328.781, "r_y3": 131.91600000000005, "coord_origin": "TOPLEFT"}, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 150.44299999999998, "r_x1": 545.113, "r_y1": 150.44299999999998, "r_x2": 545.113, "r_y2": 142.71299999999997, "r_x3": 328.781, "r_y3": 142.71299999999997, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.40200000000004, "r_x1": 406.322, "r_y1": 161.40200000000004, "r_x2": 406.322, "r_y2": 153.67200000000003, "r_x3": 328.781, "r_y3": 153.67200000000003, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 161.53099999999995, "r_x1": 506.181, "r_y1": 161.53099999999995, "r_x2": 506.181, "r_y2": 153.83399999999995, "r_x3": 406.322, "r_y3": 153.83399999999995, "coord_origin": "TOPLEFT"}, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 15, "label": "text", "bbox": {"l": 70.031, "t": 75.96400000000006, "r": 223.581, "b": 83.69399999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.6886764168739319, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "list_item", "bbox": {"l": 328.781, "t": 76.12599999999998, "r": 383.646, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7556979060173035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 98.40800000000002, "r": 65.05, "b": 106.10500000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.7723011374473572, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 120.957, "r": 323.8, "b": 128.654, "coord_origin": "TOPLEFT"}, "confidence": 0.8375797271728516, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 164.52700000000004, "r": 65.05, "b": 172.22400000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8580600619316101, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 50.112, "t": 230.64499999999998, "r": 65.05, "b": 238.34199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.8512731194496155, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 274.846, "r": 65.05, "b": 282.543, "coord_origin": "TOPLEFT"}, "confidence": 0.8494512438774109, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 50.112, "t": 330.005, "r": 65.05, "b": 337.702, "coord_origin": "TOPLEFT"}, "confidence": 0.8567671179771423, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "list_item", "bbox": {"l": 50.112, "t": 385.165, "r": 65.05, "b": 392.862, "coord_origin": "TOPLEFT"}, "confidence": 0.8832162618637085, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 50.112, "t": 462.242, "r": 65.05, "b": 469.939, "coord_origin": "TOPLEFT"}, "confidence": 0.8431925177574158, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 50.112, "t": 506.443, "r": 65.05, "b": 514.14, "coord_origin": "TOPLEFT"}, "confidence": 0.8405635952949524, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 550.643, "r": 65.05, "b": 558.34, "coord_origin": "TOPLEFT"}, "confidence": 0.8241521716117859, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 594.844, "r": 65.05, "b": 602.5409999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.8360886573791504, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "list_item", "bbox": {"l": 50.112, "t": 639.045, "r": 65.05, "b": 646.742, "coord_origin": "TOPLEFT"}, "confidence": 0.8079474568367004, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 694.204, "r": 65.05, "b": 701.901, "coord_origin": "TOPLEFT"}, "confidence": 0.8385783433914185, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "page_footer", "bbox": {"l": 292.63, "t": 734.402, "r": 302.593, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9069584012031555, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 15, "page_no": 9, "cluster": {"id": 15, "label": "text", "bbox": {"l": 70.031, "t": 75.96400000000006, "r": 223.581, "b": 83.69399999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.6886764168739319, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Computer Vision and Pattern Recognition"}, {"label": "list_item", "id": 14, "page_no": 9, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 328.781, "t": 76.12599999999998, "r": 383.646, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7556979060173035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "and evaluation."}, {"label": "list_item", "id": 13, "page_no": 9, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 98.40800000000002, "r": 65.05, "b": 106.10500000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.7723011374473572, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[26]"}, {"label": "list_item", "id": 9, "page_no": 9, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 120.957, "r": 323.8, "b": 128.654, "coord_origin": "TOPLEFT"}, "confidence": 0.8375797271728516, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[38]"}, {"label": "list_item", "id": 2, "page_no": 9, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 164.52700000000004, "r": 65.05, "b": 172.22400000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8580600619316101, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[27]"}, {"label": "list_item", "id": 4, "page_no": 9, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 50.112, "t": 230.64499999999998, "r": 65.05, "b": 238.34199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.8512731194496155, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[28]"}, {"label": "list_item", "id": 5, "page_no": 9, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 274.846, "r": 65.05, "b": 282.543, "coord_origin": "TOPLEFT"}, "confidence": 0.8494512438774109, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[29]"}, {"label": "list_item", "id": 3, "page_no": 9, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 50.112, "t": 330.005, "r": 65.05, "b": 337.702, "coord_origin": "TOPLEFT"}, "confidence": 0.8567671179771423, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[30]"}, {"label": "list_item", "id": 1, "page_no": 9, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 50.112, "t": 385.165, "r": 65.05, "b": 392.862, "coord_origin": "TOPLEFT"}, "confidence": 0.8832162618637085, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[31]"}, {"label": "list_item", "id": 6, "page_no": 9, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 50.112, "t": 462.242, "r": 65.05, "b": 469.939, "coord_origin": "TOPLEFT"}, "confidence": 0.8431925177574158, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[32]"}, {"label": "list_item", "id": 7, "page_no": 9, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 50.112, "t": 506.443, "r": 65.05, "b": 514.14, "coord_origin": "TOPLEFT"}, "confidence": 0.8405635952949524, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[33]"}, {"label": "list_item", "id": 11, "page_no": 9, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 550.643, "r": 65.05, "b": 558.34, "coord_origin": "TOPLEFT"}, "confidence": 0.8241521716117859, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[34]"}, {"label": "list_item", "id": 10, "page_no": 9, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 594.844, "r": 65.05, "b": 602.5409999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.8360886573791504, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[35]"}, {"label": "list_item", "id": 12, "page_no": 9, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 50.112, "t": 639.045, "r": 65.05, "b": 646.742, "coord_origin": "TOPLEFT"}, "confidence": 0.8079474568367004, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[36]"}, {"label": "list_item", "id": 8, "page_no": 9, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 694.204, "r": 65.05, "b": 701.901, "coord_origin": "TOPLEFT"}, "confidence": 0.8385783433914185, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[37]"}, {"label": "page_footer", "id": 0, "page_no": 9, "cluster": {"id": 0, "label": "page_footer", "bbox": {"l": 292.63, "t": 734.402, "r": 302.593, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9069584012031555, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10"}], "body": [{"label": "text", "id": 15, "page_no": 9, "cluster": {"id": 15, "label": "text", "bbox": {"l": 70.031, "t": 75.96400000000006, "r": 223.581, "b": 83.69399999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.6886764168739319, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Computer Vision and Pattern Recognition"}, {"label": "list_item", "id": 14, "page_no": 9, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 328.781, "t": 76.12599999999998, "r": 383.646, "b": 83.82299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7556979060173035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "and evaluation."}, {"label": "list_item", "id": 13, "page_no": 9, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 98.40800000000002, "r": 65.05, "b": 106.10500000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.7723011374473572, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[26]"}, {"label": "list_item", "id": 9, "page_no": 9, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 120.957, "r": 323.8, "b": 128.654, "coord_origin": "TOPLEFT"}, "confidence": 0.8375797271728516, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[38]"}, {"label": "list_item", "id": 2, "page_no": 9, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 164.52700000000004, "r": 65.05, "b": 172.22400000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8580600619316101, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[27]"}, {"label": "list_item", "id": 4, "page_no": 9, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 50.112, "t": 230.64499999999998, "r": 65.05, "b": 238.34199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.8512731194496155, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[28]"}, {"label": "list_item", "id": 5, "page_no": 9, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 274.846, "r": 65.05, "b": 282.543, "coord_origin": "TOPLEFT"}, "confidence": 0.8494512438774109, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[29]"}, {"label": "list_item", "id": 3, "page_no": 9, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 50.112, "t": 330.005, "r": 65.05, "b": 337.702, "coord_origin": "TOPLEFT"}, "confidence": 0.8567671179771423, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[30]"}, {"label": "list_item", "id": 1, "page_no": 9, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 50.112, "t": 385.165, "r": 65.05, "b": 392.862, "coord_origin": "TOPLEFT"}, "confidence": 0.8832162618637085, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[31]"}, {"label": "list_item", "id": 6, "page_no": 9, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 50.112, "t": 462.242, "r": 65.05, "b": 469.939, "coord_origin": "TOPLEFT"}, "confidence": 0.8431925177574158, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[32]"}, {"label": "list_item", "id": 7, "page_no": 9, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 50.112, "t": 506.443, "r": 65.05, "b": 514.14, "coord_origin": "TOPLEFT"}, "confidence": 0.8405635952949524, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[33]"}, {"label": "list_item", "id": 11, "page_no": 9, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 550.643, "r": 65.05, "b": 558.34, "coord_origin": "TOPLEFT"}, "confidence": 0.8241521716117859, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[34]"}, {"label": "list_item", "id": 10, "page_no": 9, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 594.844, "r": 65.05, "b": 602.5409999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.8360886573791504, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[35]"}, {"label": "list_item", "id": 12, "page_no": 9, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 50.112, "t": 639.045, "r": 65.05, "b": 646.742, "coord_origin": "TOPLEFT"}, "confidence": 0.8079474568367004, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[36]"}, {"label": "list_item", "id": 8, "page_no": 9, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 694.204, "r": 65.05, "b": 701.901, "coord_origin": "TOPLEFT"}, "confidence": 0.8385783433914185, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[37]"}], "headers": [{"label": "page_footer", "id": 0, "page_no": 9, "cluster": {"id": 0, "label": "page_footer", "bbox": {"l": 292.63, "t": 734.402, "r": 302.593, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9069584012031555, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10"}]}}, {"page_no": 10, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.184, "r_y0": 135.48400000000004, "r_x1": 375.043, "r_y1": 135.48400000000004, "r_x2": 375.043, "r_y2": 122.42399999999998, "r_x3": 220.184, "r_y3": 122.42399999999998, "coord_origin": "TOPLEFT"}, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 220.697, "r_x1": 286.365, "r_y1": 220.697, "r_x2": 286.365, "r_y2": 212.14499999999998, "r_x3": 50.112, "r_y3": 212.14499999999998, "coord_origin": "TOPLEFT"}, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 232.65200000000004, "r_x1": 286.365, "r_y1": 232.65200000000004, "r_x2": 286.365, "r_y2": 224.10000000000002, "r_x3": 50.112, "r_y3": 224.10000000000002, "coord_origin": "TOPLEFT"}, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 244.60699999999997, "r_x1": 286.365, "r_y1": 244.60699999999997, "r_x2": 286.365, "r_y2": 236.05499999999995, "r_x3": 50.112, "r_y3": 236.05499999999995, "coord_origin": "TOPLEFT"}, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 256.562, "r_x1": 286.365, "r_y1": 256.562, "r_x2": 286.365, "r_y2": 248.01, "r_x3": 50.112, "r_y3": 248.01, "coord_origin": "TOPLEFT"}, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 268.51700000000005, "r_x1": 286.365, "r_y1": 268.51700000000005, "r_x2": 286.365, "r_y2": 259.96500000000003, "r_x3": 50.112, "r_y3": 259.96500000000003, "coord_origin": "TOPLEFT"}, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 280.472, "r_x1": 286.365, "r_y1": 280.472, "r_x2": 286.365, "r_y2": 271.91999999999996, "r_x3": 50.112, "r_y3": 271.91999999999996, "coord_origin": "TOPLEFT"}, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 292.428, "r_x1": 286.365, "r_y1": 292.428, "r_x2": 286.365, "r_y2": 283.876, "r_x3": 50.112, "r_y3": 283.876, "coord_origin": "TOPLEFT"}, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 304.383, "r_x1": 286.365, "r_y1": 304.383, "r_x2": 286.365, "r_y2": 295.831, "r_x3": 50.112, "r_y3": 295.831, "coord_origin": "TOPLEFT"}, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 316.338, "r_x1": 118.834, "r_y1": 316.338, "r_x2": 118.834, "r_y2": 307.786, "r_x3": 50.112, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "or column spans.", "orig": "or column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.307, "r_y0": 316.338, "r_x1": 286.365, "r_y1": 316.338, "r_x2": 286.365, "r_y2": 307.786, "r_x3": 123.307, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "Therefore a strict HTML structure looks", "orig": "Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 328.293, "r_x1": 127.163, "r_y1": 328.293, "r_x2": 127.163, "r_y2": 319.741, "r_x3": 50.112, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "always rectangular.", "orig": "always rectangular.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.257, "r_y0": 328.293, "r_x1": 286.365, "r_y1": 328.293, "r_x2": 286.365, "r_y2": 319.741, "r_x3": 131.257, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "However, HTML is a lenient encoding", "orig": "However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 340.248, "r_x1": 95.163, "r_y1": 340.248, "r_x2": 95.163, "r_y2": 331.696, "r_x3": 50.112, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "format, i.e.", "orig": "format, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.459, "r_y0": 340.248, "r_x1": 286.365, "r_y1": 340.248, "r_x2": 286.365, "r_y2": 331.696, "r_x3": 101.459, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "tables with rows of different sizes might still", "orig": "tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 352.204, "r_x1": 257.942, "r_y1": 352.204, "r_x2": 257.942, "r_y2": 343.652, "r_x3": 50.112, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "be regarded as correct due to implicit display rules.", "orig": "be regarded as correct due to implicit display rules.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.574, "r_y0": 352.204, "r_x1": 286.365, "r_y1": 352.204, "r_x2": 286.365, "r_y2": 343.652, "r_x3": 262.574, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "These", "orig": "These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 364.159, "r_x1": 286.365, "r_y1": 364.159, "r_x2": 286.365, "r_y2": 355.607, "r_x3": 50.112, "r_y3": 355.607, "coord_origin": "TOPLEFT"}, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 376.114, "r_x1": 286.365, "r_y1": 376.114, "r_x2": 286.365, "r_y2": 367.562, "r_x3": 50.112, "r_y3": 367.562, "coord_origin": "TOPLEFT"}, "text": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "orig": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 388.069, "r_x1": 230.804, "r_y1": 388.069, "r_x2": 230.804, "r_y2": 379.517, "r_x3": 50.112, "r_y3": 379.517, "coord_origin": "TOPLEFT"}, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.726, "r_y0": 400.226, "r_x1": 248.477, "r_y1": 400.226, "r_x2": 248.477, "r_y2": 391.674, "r_x3": 240.726, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.96, "r_y0": 400.226, "r_x1": 277.458, "r_y1": 400.226, "r_x2": 277.458, "r_y2": 391.674, "r_x3": 252.96, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "derive", "orig": "derive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.942, "r_y0": 400.226, "r_x1": 286.365, "r_y1": 400.226, "r_x2": 286.365, "r_y2": 391.674, "r_x3": 281.942, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 412.181, "r_x1": 223.571, "r_y1": 412.181, "r_x2": 223.571, "r_y2": 403.629, "r_x3": 50.112, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "missing bounding box out of its neighbors.", "orig": "missing bounding box out of its neighbors.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.004, "r_y0": 412.181, "r_x1": 286.365, "r_y1": 412.181, "r_x2": 286.365, "r_y2": 403.629, "r_x3": 228.004, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "As a first step,", "orig": "As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 424.136, "r_x1": 286.365, "r_y1": 424.136, "r_x2": 286.365, "r_y2": 415.584, "r_x3": 50.112, "r_y3": 415.584, "coord_origin": "TOPLEFT"}, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 436.092, "r_x1": 189.519, "r_y1": 436.092, "r_x2": 189.519, "r_y2": 427.54, "r_x3": 50.112, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "grid that covers the table structure.", "orig": "grid that covers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 436.092, "r_x1": 286.365, "r_y1": 436.092, "r_x2": 286.365, "r_y2": 427.54, "r_x3": 193.414, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "In case of strict HTML", "orig": "In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.047, "r_x1": 286.365, "r_y1": 448.047, "r_x2": 286.365, "r_y2": 439.495, "r_x3": 50.112, "r_y3": 439.495, "coord_origin": "TOPLEFT"}, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.002, "r_x1": 286.365, "r_y1": 460.002, "r_x2": 286.365, "r_y2": 451.45, "r_x3": 50.112, "r_y3": 451.45, "coord_origin": "TOPLEFT"}, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 471.957, "r_x1": 286.365, "r_y1": 471.957, "r_x2": 286.365, "r_y2": 463.405, "r_x3": 50.112, "r_y3": 463.405, "coord_origin": "TOPLEFT"}, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 483.912, "r_x1": 143.76, "r_y1": 483.912, "r_x2": 143.76, "r_y2": 475.36, "r_x3": 50.112, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "for a rectangular table,", "orig": "for a rectangular table,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.696, "r_y0": 483.912, "r_x1": 153.235, "r_y1": 483.912, "r_x2": 153.235, "r_y2": 475.36, "r_x3": 147.696, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.881, "r_y0": 483.912, "r_x1": 163.526, "r_y1": 483.912, "r_x2": 163.526, "r_y2": 475.36, "r_x3": 156.881, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.173, "r_y0": 483.912, "r_x1": 286.365, "r_y1": 483.912, "r_x2": 286.365, "r_y2": 475.36, "r_x3": 167.173, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "possible to compute the geo-", "orig": "possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 495.867, "r_x1": 286.365, "r_y1": 495.867, "r_x2": 286.365, "r_y2": 487.315, "r_x3": 50.112, "r_y3": 487.315, "coord_origin": "TOPLEFT"}, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.823, "r_x1": 286.365, "r_y1": 507.823, "r_x2": 286.365, "r_y2": 499.271, "r_x3": 50.112, "r_y3": 499.271, "coord_origin": "TOPLEFT"}, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.778, "r_x1": 286.365, "r_y1": 519.778, "r_x2": 286.365, "r_y2": 511.226, "r_x3": 50.112, "r_y3": 511.226, "coord_origin": "TOPLEFT"}, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.733, "r_x1": 286.365, "r_y1": 531.733, "r_x2": 286.365, "r_y2": 523.181, "r_x3": 50.112, "r_y3": 523.181, "coord_origin": "TOPLEFT"}, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.688, "r_x1": 286.365, "r_y1": 543.688, "r_x2": 286.365, "r_y2": 535.136, "r_x3": 50.112, "r_y3": 535.136, "coord_origin": "TOPLEFT"}, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.643, "r_x1": 286.365, "r_y1": 555.643, "r_x2": 286.365, "r_y2": 547.091, "r_x3": 50.112, "r_y3": 547.091, "coord_origin": "TOPLEFT"}, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.5989999999999, "r_x1": 257.474, "r_y1": 567.5989999999999, "r_x2": 257.474, "r_y2": 559.047, "r_x3": 50.112, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.949, "r_y0": 567.5989999999999, "r_x1": 286.365, "r_y1": 567.5989999999999, "r_x2": 286.365, "r_y2": 559.047, "r_x3": 263.949, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.554, "r_x1": 242.251, "r_y1": 579.554, "r_x2": 242.251, "r_y2": 571.002, "r_x3": 50.112, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "we have decided to simply discard those tables.", "orig": "we have decided to simply discard those tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.714, "r_y0": 579.554, "r_x1": 286.365, "r_y1": 579.554, "r_x2": 286.365, "r_y2": 571.002, "r_x3": 246.714, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "In case of", "orig": "In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.509, "r_x1": 286.365, "r_y1": 591.509, "r_x2": 286.365, "r_y2": 582.957, "r_x3": 50.112, "r_y3": 582.957, "coord_origin": "TOPLEFT"}, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.4639999999999, "r_x1": 286.365, "r_y1": 603.4639999999999, "r_x2": 286.365, "r_y2": 594.912, "r_x3": 50.112, "r_y3": 594.912, "coord_origin": "TOPLEFT"}, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.419, "r_x1": 286.365, "r_y1": 615.419, "r_x2": 286.365, "r_y2": 606.867, "r_x3": 50.112, "r_y3": 606.867, "coord_origin": "TOPLEFT"}, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.374, "r_x1": 242.261, "r_y1": 627.374, "r_x2": 242.261, "r_y2": 618.822, "r_x3": 50.112, "r_y3": 618.822, "coord_origin": "TOPLEFT"}, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 651.487, "r_x1": 179.905, "r_y1": 651.487, "r_x2": 179.905, "r_y2": 642.935, "r_x3": 50.112, "r_y3": 642.935, "coord_origin": "TOPLEFT"}, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 702.107, "r_x1": 286.365, "r_y1": 702.107, "r_x2": 286.365, "r_y2": 693.5550000000001, "r_x3": 50.112, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 714.062, "r_x1": 84.144, "r_y1": 714.062, "r_x2": 84.144, "r_y2": 705.51, "r_x3": 50.112, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.238, "r_y0": 714.062, "r_x1": 286.365, "r_y1": 714.062, "r_x2": 286.365, "r_y2": 705.51, "r_x3": 91.238, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.043, "r_y0": 171.476, "r_x1": 468.393, "r_y1": 171.476, "r_x2": 468.393, "r_y2": 162.92399999999998, "r_x3": 431.043, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "structure,", "orig": "structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 472.508, "r_y0": 171.476, "r_x1": 491.327, "r_y1": 171.476, "r_x2": 491.327, "r_y2": 162.92399999999998, "r_x3": 472.508, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.113, "r_y0": 171.476, "r_x1": 545.115, "r_y1": 171.476, "r_x2": 545.115, "r_y2": 162.92399999999998, "r_x3": 495.113, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "and content.", "orig": "and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.43100000000004, "r_x1": 545.115, "r_y1": 183.43100000000004, "r_x2": 545.115, "r_y2": 174.87900000000002, "r_x3": 308.862, "r_y3": 174.87900000000002, "coord_origin": "TOPLEFT"}, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 195.38599999999997, "r_x1": 545.115, "r_y1": 195.38599999999997, "r_x2": 545.115, "r_y2": 186.83399999999995, "r_x3": 308.862, "r_y3": 186.83399999999995, "coord_origin": "TOPLEFT"}, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 207.34199999999998, "r_x1": 484.074, "r_y1": 207.34199999999998, "r_x2": 484.074, "r_y2": 198.78999999999996, "r_x3": 308.862, "r_y3": 198.78999999999996, "coord_origin": "TOPLEFT"}, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.01099999999997, "r_x1": 448.089, "r_y1": 232.01099999999997, "r_x2": 448.089, "r_y2": 223.45899999999995, "r_x3": 308.862, "r_y3": 223.45899999999995, "coord_origin": "TOPLEFT"}, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.382, "r_y0": 244.726, "r_x1": 492.911, "r_y1": 244.726, "r_x2": 492.911, "r_y2": 236.17399999999998, "r_x3": 335.382, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "Prepare styling and content templates:", "orig": "Prepare styling and content templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.669, "r_y0": 244.726, "r_x1": 545.115, "r_y1": 244.726, "r_x2": 545.115, "r_y2": 236.17399999999998, "r_x3": 498.669, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "The styling", "orig": "The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.68100000000004, "r_x1": 545.115, "r_y1": 256.68100000000004, "r_x2": 545.115, "r_y2": 248.12900000000002, "r_x3": 308.862, "r_y3": 248.12900000000002, "coord_origin": "TOPLEFT"}, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.63599999999997, "r_x1": 481.733, "r_y1": 268.63599999999997, "r_x2": 481.733, "r_y2": 260.08399999999995, "r_x3": 308.862, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "groups of scope specific appearances (e.g.", "orig": "groups of scope specific appearances (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.119, "r_y0": 268.63599999999997, "r_x1": 545.115, "r_y1": 268.63599999999997, "r_x2": 545.115, "r_y2": 260.08399999999995, "r_x3": 488.119, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "financial data,", "orig": "financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.591, "r_x1": 393.385, "r_y1": 280.591, "r_x2": 393.385, "r_y2": 272.039, "r_x3": 308.862, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.119, "r_y0": 280.591, "r_x1": 545.115, "r_y1": 280.591, "r_x2": 545.115, "r_y2": 272.039, "r_x3": 400.119, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.546, "r_x1": 545.115, "r_y1": 292.546, "r_x2": 545.115, "r_y2": 283.994, "r_x3": 308.862, "r_y3": 283.994, "coord_origin": "TOPLEFT"}, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.502, "r_x1": 349.808, "r_y1": 304.502, "r_x2": 349.808, "r_y2": 295.95, "r_x3": 308.862, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "frequently", "orig": "frequently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.152, "r_y0": 304.502, "r_x1": 487.183, "r_y1": 304.502, "r_x2": 487.183, "r_y2": 295.95, "r_x3": 354.152, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "used terms out of non-synthetic", "orig": "used terms out of non-synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.526, "r_y0": 304.502, "r_x1": 523.068, "r_y1": 304.502, "r_x2": 523.068, "r_y2": 295.95, "r_x3": 491.526, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.412, "r_y0": 304.502, "r_x1": 545.115, "r_y1": 304.502, "r_x2": 545.115, "r_y2": 295.95, "r_x3": 527.412, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.457, "r_x1": 425.693, "r_y1": 316.457, "r_x2": 425.693, "r_y2": 307.905, "r_x3": 308.862, "r_y3": 307.905, "coord_origin": "TOPLEFT"}, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.692, "r_y0": 329.171, "r_x1": 435.377, "r_y1": 329.171, "r_x2": 435.377, "r_y2": 320.619, "r_x3": 332.692, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "Generate table structures:", "orig": "Generate table structures:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.342, "r_y0": 329.171, "r_x1": 545.115, "r_y1": 329.171, "r_x2": 545.115, "r_y2": 320.619, "r_x3": 439.342, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "The structure of each syn-", "orig": "The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 341.126, "r_x1": 545.115, "r_y1": 341.126, "r_x2": 545.115, "r_y2": 332.574, "r_x3": 308.862, "r_y3": 332.574, "coord_origin": "TOPLEFT"}, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 353.081, "r_x1": 341.519, "r_y1": 353.081, "r_x2": 341.519, "r_y2": 344.529, "r_x3": 308.862, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "tentially", "orig": "tentially", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.813, "r_y0": 353.081, "r_x1": 427.168, "r_y1": 353.081, "r_x2": 427.168, "r_y2": 344.529, "r_x3": 345.813, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "spans over multiple", "orig": "spans over multiple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.462, "r_y0": 353.081, "r_x1": 545.115, "r_y1": 353.081, "r_x2": 545.115, "r_y2": 344.529, "r_x3": 431.462, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "rows and a table body that", "orig": "rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 365.037, "r_x1": 545.115, "r_y1": 365.037, "r_x2": 545.115, "r_y2": 356.485, "r_x3": 308.862, "r_y3": 356.485, "coord_origin": "TOPLEFT"}, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.992, "r_x1": 545.115, "r_y1": 376.992, "r_x2": 545.115, "r_y2": 368.44, "r_x3": 308.862, "r_y3": 368.44, "coord_origin": "TOPLEFT"}, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.947, "r_x1": 348.334, "r_y1": 388.947, "r_x2": 348.334, "r_y2": 380.395, "r_x3": 308.862, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "boundary.", "orig": "boundary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.504, "r_y0": 388.947, "r_x1": 545.115, "r_y1": 388.947, "r_x2": 545.115, "r_y2": 380.395, "r_x3": 353.504, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "The table structure is described by the parame-", "orig": "The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.902, "r_x1": 326.018, "r_y1": 400.902, "r_x2": 326.018, "r_y2": 392.35, "r_x3": 308.862, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "ters:", "orig": "ters:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.909, "r_y0": 400.902, "r_x1": 545.115, "r_y1": 400.902, "r_x2": 545.115, "r_y2": 392.35, "r_x3": 330.909, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "Total number of table rows and columns, number of", "orig": "Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.857, "r_x1": 545.115, "r_y1": 412.857, "r_x2": 545.115, "r_y2": 404.305, "r_x3": 308.862, "r_y3": 404.305, "coord_origin": "TOPLEFT"}, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.812, "r_x1": 333.49, "r_y1": 424.812, "r_x2": 333.49, "r_y2": 416.26, "r_x3": 308.862, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "spans,", "orig": "spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.082, "r_y0": 424.812, "r_x1": 418.66, "r_y1": 424.812, "r_x2": 418.66, "r_y2": 416.26, "r_x3": 338.082, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "column only spans,", "orig": "column only spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.253, "r_y0": 424.812, "r_x1": 545.115, "r_y1": 424.812, "r_x2": 545.115, "r_y2": 416.26, "r_x3": 423.253, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "both row and column spans),", "orig": "both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.768, "r_x1": 545.115, "r_y1": 436.768, "r_x2": 545.115, "r_y2": 428.216, "r_x3": 308.862, "r_y3": 428.216, "coord_origin": "TOPLEFT"}, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.723, "r_x1": 345.943, "r_y1": 448.723, "r_x2": 345.943, "r_y2": 440.171, "r_x3": 308.862, "r_y3": 440.171, "coord_origin": "TOPLEFT"}, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.073, "r_y0": 461.294, "r_x1": 511.864, "r_y1": 461.294, "r_x2": 511.864, "r_y2": 452.706, "r_x3": 488.073, "r_y3": 452.706, "coord_origin": "TOPLEFT"}, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.863, "r_y0": 461.437, "r_x1": 545.108, "r_y1": 461.437, "r_x2": 545.108, "r_y2": 452.885, "r_x3": 511.863, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.392, "r_x1": 545.115, "r_y1": 473.392, "r_x2": 545.115, "r_y2": 464.84, "r_x3": 308.862, "r_y3": 464.84, "coord_origin": "TOPLEFT"}, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.348, "r_x1": 545.115, "r_y1": 485.348, "r_x2": 545.115, "r_y2": 476.796, "r_x3": 308.862, "r_y3": 476.796, "coord_origin": "TOPLEFT"}, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.303, "r_x1": 379.148, "r_y1": 497.303, "r_x2": 379.148, "r_y2": 488.751, "r_x3": 308.862, "r_y3": 488.751, "coord_origin": "TOPLEFT"}, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.217, "r_y0": 510.017, "r_x1": 434.082, "r_y1": 510.017, "r_x2": 434.082, "r_y2": 501.465, "r_x3": 334.217, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Apply styling templates:", "orig": "Apply styling templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.063, "r_y0": 510.017, "r_x1": 545.115, "r_y1": 510.017, "r_x2": 545.115, "r_y2": 501.465, "r_x3": 439.063, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Depending on the domain", "orig": "Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.972, "r_x1": 406.884, "r_y1": 521.972, "r_x2": 406.884, "r_y2": 513.4200000000001, "r_x3": 308.862, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "of the synthetic dataset,", "orig": "of the synthetic dataset,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.019, "r_y0": 521.972, "r_x1": 545.115, "r_y1": 521.972, "r_x2": 545.115, "r_y2": 513.4200000000001, "r_x3": 411.019, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "a set of styling templates is first", "orig": "a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.928, "r_x1": 384.299, "r_y1": 533.928, "r_x2": 384.299, "r_y2": 525.376, "r_x3": 308.862, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.253, "r_y0": 533.928, "r_x1": 545.115, "r_y1": 533.928, "r_x2": 545.115, "r_y2": 525.376, "r_x3": 391.253, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.883, "r_x1": 496.159, "r_y1": 545.883, "r_x2": 496.159, "r_y2": 537.331, "r_x3": 308.862, "r_y3": 537.331, "coord_origin": "TOPLEFT"}, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.402, "r_y0": 558.597, "r_x1": 450.371, "r_y1": 558.597, "r_x2": 450.371, "r_y2": 550.045, "r_x3": 335.402, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "Render the complete tables:", "orig": "Render the complete tables:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 456.139, "r_y0": 558.597, "r_x1": 545.115, "r_y1": 558.597, "r_x2": 545.115, "r_y2": 550.045, "r_x3": 456.139, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "The synthetic table is", "orig": "The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 570.552, "r_x1": 334.326, "r_y1": 570.552, "r_x2": 334.326, "r_y2": 562.0, "r_x3": 308.862, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "finally", "orig": "finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.983, "r_y0": 570.552, "r_x1": 545.115, "r_y1": 570.552, "r_x2": 545.115, "r_y2": 562.0, "r_x3": 337.983, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "rendered by a web browser engine to generate the", "orig": "rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 582.5070000000001, "r_x1": 545.115, "r_y1": 582.5070000000001, "r_x2": 545.115, "r_y2": 573.955, "r_x3": 308.862, "r_y3": 573.955, "coord_origin": "TOPLEFT"}, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 594.463, "r_x1": 545.115, "r_y1": 594.463, "r_x2": 545.115, "r_y2": 585.9110000000001, "r_x3": 308.862, "r_y3": 585.9110000000001, "coord_origin": "TOPLEFT"}, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 606.418, "r_x1": 341.23, "r_y1": 606.418, "r_x2": 341.23, "r_y2": 597.866, "r_x3": 308.862, "r_y3": 597.866, "coord_origin": "TOPLEFT"}, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.591, "r_y0": 633.039, "r_x1": 376.493, "r_y1": 633.039, "r_x2": 376.493, "r_y2": 622.2909999999999, "r_x3": 323.591, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "Prediction", "orig": "Prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.255, "r_y0": 633.039, "r_x1": 461.076, "r_y1": 633.039, "r_x2": 461.076, "r_y2": 622.2909999999999, "r_x3": 382.255, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "post-processing", "orig": "post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.826, "r_y0": 633.039, "r_x1": 481.794, "r_y1": 633.039, "r_x2": 481.794, "r_y2": 622.2909999999999, "r_x3": 466.826, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.556, "r_y0": 633.039, "r_x1": 545.109, "r_y1": 633.039, "r_x2": 545.109, "r_y2": 622.2909999999999, "r_x3": 487.556, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "PDF docu-", "orig": "PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 646.987, "r_x1": 357.341, "r_y1": 646.987, "r_x2": 357.341, "r_y2": 636.239, "r_x3": 326.795, "r_y3": 636.239, "coord_origin": "TOPLEFT"}, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 678.197, "r_x1": 545.115, "r_y1": 678.197, "r_x2": 545.115, "r_y2": 669.645, "r_x3": 308.862, "r_y3": 669.645, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 690.152, "r_x1": 545.115, "r_y1": 690.152, "r_x2": 545.115, "r_y2": 681.6, "r_x3": 308.862, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 702.107, "r_x1": 545.115, "r_y1": 702.107, "r_x2": 545.115, "r_y2": 693.5550000000001, "r_x3": 308.862, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 714.063, "r_x1": 371.427, "r_y1": 714.063, "r_x2": 371.427, "r_y2": 705.511, "r_x3": 308.862, "r_y3": 705.511, "coord_origin": "TOPLEFT"}, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 18, "label": "section_header", "bbox": {"l": 132.842, "t": 110.57500000000005, "r": 465.376, "b": 121.32299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.6497084498405457, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 161.16099999999994, "r": 175.964, "b": 171.909, "coord_origin": "TOPLEFT"}, "confidence": 0.9454860091209412, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 162.92399999999998, "r": 426.929, "b": 171.476, "coord_origin": "TOPLEFT"}, "confidence": 0.9596064686775208, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "section_header", "bbox": {"l": 50.112, "t": 180.97900000000004, "r": 150.364, "b": 190.83100000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9535645842552185, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 200.18899999999996, "r": 286.365, "b": 208.74099999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9864971041679382, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 320.817, "t": 211.50400000000002, "r": 545.115, "b": 220.05600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9261796474456787, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 320.817, "t": 236.17399999999998, "r": 328.289, "b": 244.726, "coord_origin": "TOPLEFT"}, "confidence": 0.9642952680587769, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 320.817, "t": 320.619, "r": 328.289, "b": 329.171, "coord_origin": "TOPLEFT"}, "confidence": 0.9699994921684265, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 391.674, "r": 236.243, "b": 400.226, "coord_origin": "TOPLEFT"}, "confidence": 0.9826022386550903, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 320.817, "t": 452.885, "r": 485.758, "b": 461.437, "coord_origin": "TOPLEFT"}, "confidence": 0.9568928480148315, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 320.817, "t": 501.465, "r": 328.289, "b": 510.017, "coord_origin": "TOPLEFT"}, "confidence": 0.9710659980773926, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 320.817, "t": 550.045, "r": 328.289, "b": 558.597, "coord_origin": "TOPLEFT"}, "confidence": 0.9778757095336914, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "section_header", "bbox": {"l": 308.862, "t": 622.2909999999999, "r": 317.828, "b": 633.039, "coord_origin": "TOPLEFT"}, "confidence": 0.954940915107727, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 62.067, "t": 630.979, "r": 286.365, "b": 639.531, "coord_origin": "TOPLEFT"}, "confidence": 0.9335853457450867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 657.69, "r": 545.115, "b": 666.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9829329252243042, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 662.39, "r": 153.608, "b": 672.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9515743255615234, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 681.6, "r": 286.365, "b": 690.152, "coord_origin": "TOPLEFT"}, "confidence": 0.9783332347869873, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8986663222312927, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "section_header", "id": 18, "page_no": 10, "cluster": {"id": 18, "label": "section_header", "bbox": {"l": 132.842, "t": 110.57500000000005, "r": 465.376, "b": 121.32299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.6497084498405457, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers"}, {"label": "section_header", "id": 13, "page_no": 10, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 161.16099999999994, "r": 175.964, "b": 171.909, "coord_origin": "TOPLEFT"}, "confidence": 0.9454860091209412, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Details on the datasets"}, {"label": "text", "id": 8, "page_no": 10, "cluster": {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 162.92399999999998, "r": 426.929, "b": 171.476, "coord_origin": "TOPLEFT"}, "confidence": 0.9596064686775208, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "ances in regard to their size,"}, {"label": "section_header", "id": 11, "page_no": 10, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 50.112, "t": 180.97900000000004, "r": 150.364, "b": 190.83100000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9535645842552185, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.1. Data preparation"}, {"label": "text", "id": 0, "page_no": 10, "cluster": {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 200.18899999999996, "r": 286.365, "b": 208.74099999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9864971041679382, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As a first step of our data preparation process, we have"}, {"label": "text", "id": 15, "page_no": 10, "cluster": {"id": 15, "label": "text", "bbox": {"l": 320.817, "t": 211.50400000000002, "r": 545.115, "b": 220.05600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9261796474456787, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The process of generating a synthetic dataset can be de-"}, {"label": "list_item", "id": 7, "page_no": 10, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 320.817, "t": 236.17399999999998, "r": 328.289, "b": 244.726, "coord_origin": "TOPLEFT"}, "confidence": 0.9642952680587769, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1."}, {"label": "list_item", "id": 6, "page_no": 10, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 320.817, "t": 320.619, "r": 328.289, "b": 329.171, "coord_origin": "TOPLEFT"}, "confidence": 0.9699994921684265, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2."}, {"label": "text", "id": 2, "page_no": 10, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 391.674, "r": 236.243, "b": 400.226, "coord_origin": "TOPLEFT"}, "confidence": 0.9826022386550903, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have developed a technique that tries"}, {"label": "list_item", "id": 9, "page_no": 10, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 320.817, "t": 452.885, "r": 485.758, "b": 461.437, "coord_origin": "TOPLEFT"}, "confidence": 0.9568928480148315, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Generate content: Based on the dataset"}, {"label": "list_item", "id": 5, "page_no": 10, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 320.817, "t": 501.465, "r": 328.289, "b": 510.017, "coord_origin": "TOPLEFT"}, "confidence": 0.9710659980773926, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4."}, {"label": "list_item", "id": 4, "page_no": 10, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 320.817, "t": 550.045, "r": 328.289, "b": 558.597, "coord_origin": "TOPLEFT"}, "confidence": 0.9778757095336914, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5."}, {"label": "section_header", "id": 10, "page_no": 10, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 308.862, "t": 622.2909999999999, "r": 317.828, "b": 633.039, "coord_origin": "TOPLEFT"}, "confidence": 0.954940915107727, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2."}, {"label": "text", "id": 14, "page_no": 10, "cluster": {"id": 14, "label": "text", "bbox": {"l": 62.067, "t": 630.979, "r": 286.365, "b": 639.531, "coord_origin": "TOPLEFT"}, "confidence": 0.9335853457450867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7 illustrates the distribution of the tables across"}, {"label": "text", "id": 1, "page_no": 10, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 657.69, "r": 545.115, "b": 666.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9829329252243042, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although TableFormer can predict the table structure and"}, {"label": "section_header", "id": 12, "page_no": 10, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 662.39, "r": 153.608, "b": 672.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9515743255615234, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.2. Synthetic datasets"}, {"label": "text", "id": 3, "page_no": 10, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 681.6, "r": 286.365, "b": 690.152, "coord_origin": "TOPLEFT"}, "confidence": 0.9783332347869873, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aiming to train and evaluate our models in a broader"}, {"label": "page_footer", "id": 16, "page_no": 10, "cluster": {"id": 16, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8986663222312927, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11"}], "body": [{"label": "section_header", "id": 18, "page_no": 10, "cluster": {"id": 18, "label": "section_header", "bbox": {"l": 132.842, "t": 110.57500000000005, "r": 465.376, "b": 121.32299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.6497084498405457, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers"}, {"label": "section_header", "id": 13, "page_no": 10, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 161.16099999999994, "r": 175.964, "b": 171.909, "coord_origin": "TOPLEFT"}, "confidence": 0.9454860091209412, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Details on the datasets"}, {"label": "text", "id": 8, "page_no": 10, "cluster": {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 162.92399999999998, "r": 426.929, "b": 171.476, "coord_origin": "TOPLEFT"}, "confidence": 0.9596064686775208, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "ances in regard to their size,"}, {"label": "section_header", "id": 11, "page_no": 10, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 50.112, "t": 180.97900000000004, "r": 150.364, "b": 190.83100000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9535645842552185, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.1. Data preparation"}, {"label": "text", "id": 0, "page_no": 10, "cluster": {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 200.18899999999996, "r": 286.365, "b": 208.74099999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9864971041679382, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As a first step of our data preparation process, we have"}, {"label": "text", "id": 15, "page_no": 10, "cluster": {"id": 15, "label": "text", "bbox": {"l": 320.817, "t": 211.50400000000002, "r": 545.115, "b": 220.05600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9261796474456787, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The process of generating a synthetic dataset can be de-"}, {"label": "list_item", "id": 7, "page_no": 10, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 320.817, "t": 236.17399999999998, "r": 328.289, "b": 244.726, "coord_origin": "TOPLEFT"}, "confidence": 0.9642952680587769, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1."}, {"label": "list_item", "id": 6, "page_no": 10, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 320.817, "t": 320.619, "r": 328.289, "b": 329.171, "coord_origin": "TOPLEFT"}, "confidence": 0.9699994921684265, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2."}, {"label": "text", "id": 2, "page_no": 10, "cluster": {"id": 2, "label": "text", "bbox": {"l": 62.067, "t": 391.674, "r": 236.243, "b": 400.226, "coord_origin": "TOPLEFT"}, "confidence": 0.9826022386550903, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have developed a technique that tries"}, {"label": "list_item", "id": 9, "page_no": 10, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 320.817, "t": 452.885, "r": 485.758, "b": 461.437, "coord_origin": "TOPLEFT"}, "confidence": 0.9568928480148315, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Generate content: Based on the dataset"}, {"label": "list_item", "id": 5, "page_no": 10, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 320.817, "t": 501.465, "r": 328.289, "b": 510.017, "coord_origin": "TOPLEFT"}, "confidence": 0.9710659980773926, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4."}, {"label": "list_item", "id": 4, "page_no": 10, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 320.817, "t": 550.045, "r": 328.289, "b": 558.597, "coord_origin": "TOPLEFT"}, "confidence": 0.9778757095336914, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5."}, {"label": "section_header", "id": 10, "page_no": 10, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 308.862, "t": 622.2909999999999, "r": 317.828, "b": 633.039, "coord_origin": "TOPLEFT"}, "confidence": 0.954940915107727, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2."}, {"label": "text", "id": 14, "page_no": 10, "cluster": {"id": 14, "label": "text", "bbox": {"l": 62.067, "t": 630.979, "r": 286.365, "b": 639.531, "coord_origin": "TOPLEFT"}, "confidence": 0.9335853457450867, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7 illustrates the distribution of the tables across"}, {"label": "text", "id": 1, "page_no": 10, "cluster": {"id": 1, "label": "text", "bbox": {"l": 320.817, "t": 657.69, "r": 545.115, "b": 666.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9829329252243042, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although TableFormer can predict the table structure and"}, {"label": "section_header", "id": 12, "page_no": 10, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 662.39, "r": 153.608, "b": 672.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9515743255615234, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.2. Synthetic datasets"}, {"label": "text", "id": 3, "page_no": 10, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 681.6, "r": 286.365, "b": 690.152, "coord_origin": "TOPLEFT"}, "confidence": 0.9783332347869873, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aiming to train and evaluate our models in a broader"}], "headers": [{"label": "page_footer", "id": 16, "page_no": 10, "cluster": {"id": 16, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8986663222312927, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11"}]}}, {"page_no": 11, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.832, "r_y0": 174.32299999999998, "r_x1": 545.114, "r_y1": 174.32299999999998, "r_x2": 545.114, "r_y2": 165.77099999999996, "r_x3": 92.832, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 186.27800000000002, "r_x1": 513.522, "r_y1": 186.27800000000002, "r_x2": 513.522, "r_y2": 177.726, "r_x3": 50.112, "r_y3": 177.726, "coord_origin": "TOPLEFT"}, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 219.75199999999995, "r_x1": 286.365, "r_y1": 219.75199999999995, "r_x2": 286.365, "r_y2": 211.20000000000005, "r_x3": 70.037, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 231.707, "r_x1": 87.472, "r_y1": 231.707, "r_x2": 87.472, "r_y2": 223.15499999999997, "r_x3": 70.037, "r_y3": 223.15499999999997, "coord_origin": "TOPLEFT"}, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 252.89200000000005, "r_x1": 286.365, "r_y1": 252.89200000000005, "r_x2": 286.365, "r_y2": 244.34000000000003, "r_x3": 70.037, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 264.847, "r_x1": 150.415, "r_y1": 264.847, "r_x2": 150.415, "r_y2": 256.29499999999996, "r_x3": 70.037, "r_y3": 256.29499999999996, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.979, "r_x1": 286.365, "r_y1": 299.979, "r_x2": 286.365, "r_y2": 291.427, "r_x3": 50.112, "r_y3": 291.427, "coord_origin": "TOPLEFT"}, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.934, "r_x1": 286.365, "r_y1": 311.934, "r_x2": 286.365, "r_y2": 303.382, "r_x3": 50.112, "r_y3": 303.382, "coord_origin": "TOPLEFT"}, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.889, "r_x1": 123.387, "r_y1": 323.889, "r_x2": 123.387, "r_y2": 315.337, "r_x3": 50.112, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "More specifically,", "orig": "More specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.348, "r_y0": 323.889, "r_x1": 286.365, "r_y1": 323.889, "r_x2": 286.365, "r_y2": 315.337, "r_x3": 128.348, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "PDF documents can be seen as a se-", "orig": "PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.845, "r_x1": 286.365, "r_y1": 335.845, "r_x2": 286.365, "r_y2": 327.293, "r_x3": 50.112, "r_y3": 327.293, "coord_origin": "TOPLEFT"}, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.8, "r_x1": 286.365, "r_y1": 347.8, "r_x2": 286.365, "r_y2": 339.248, "r_x3": 50.112, "r_y3": 339.248, "coord_origin": "TOPLEFT"}, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.755, "r_x1": 286.365, "r_y1": 359.755, "r_x2": 286.365, "r_y2": 351.203, "r_x3": 50.112, "r_y3": 351.203, "coord_origin": "TOPLEFT"}, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.71, "r_x1": 286.365, "r_y1": 371.71, "r_x2": 286.365, "r_y2": 363.158, "r_x3": 50.112, "r_y3": 363.158, "coord_origin": "TOPLEFT"}, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.665, "r_x1": 286.365, "r_y1": 383.665, "r_x2": 286.365, "r_y2": 375.113, "r_x3": 50.112, "r_y3": 375.113, "coord_origin": "TOPLEFT"}, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 395.621, "r_x1": 154.56, "r_y1": 395.621, "r_x2": 154.56, "r_y2": 387.069, "r_x3": 50.112, "r_y3": 387.069, "coord_origin": "TOPLEFT"}, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 419.846, "r_x1": 95.492, "r_y1": 419.846, "r_x2": 95.492, "r_y2": 411.294, "r_x3": 50.112, "r_y3": 411.294, "coord_origin": "TOPLEFT"}, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.071, "r_x1": 218.779, "r_y1": 444.071, "r_x2": 218.779, "r_y2": 435.519, "r_x3": 50.112, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "columns for the predicted table structure.", "orig": "columns for the predicted table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.796, "r_y0": 444.071, "r_x1": 286.365, "r_y1": 444.071, "r_x2": 286.365, "r_y2": 435.519, "r_x3": 224.796, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "This represents", "orig": "This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 456.026, "r_x1": 274.51, "r_y1": 456.026, "r_x2": 274.51, "r_y2": 447.474, "r_x3": 50.112, "r_y3": 447.474, "coord_origin": "TOPLEFT"}, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.429, "r_y0": 468.296, "r_x1": 286.365, "r_y1": 468.296, "r_x2": 286.365, "r_y2": 459.744, "r_x3": 77.429, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 480.251, "r_x1": 286.365, "r_y1": 480.251, "r_x2": 286.365, "r_y2": 471.699, "r_x3": 50.112, "r_y3": 471.699, "coord_origin": "TOPLEFT"}, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.206, "r_x1": 286.365, "r_y1": 492.206, "r_x2": 286.365, "r_y2": 483.654, "r_x3": 50.112, "r_y3": 483.654, "coord_origin": "TOPLEFT"}, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 504.161, "r_x1": 110.705, "r_y1": 504.161, "r_x2": 110.705, "r_y2": 495.609, "r_x3": 50.112, "r_y3": 495.609, "coord_origin": "TOPLEFT"}, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.248, "r_y0": 516.431, "r_x1": 286.365, "r_y1": 516.431, "r_x2": 286.365, "r_y2": 507.879, "r_x3": 75.248, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 528.387, "r_x1": 226.071, "r_y1": 528.387, "r_x2": 226.071, "r_y2": 519.835, "r_x3": 50.112, "r_y3": 519.835, "coord_origin": "TOPLEFT"}, "text": "the matches as 'good' ones and 'bad' ones.", "orig": "the matches as 'good' ones and 'bad' ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.587, "r_y0": 540.656, "r_x1": 286.365, "r_y1": 540.656, "r_x2": 286.365, "r_y2": 532.104, "r_x3": 80.587, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "If all IOU scores in a column are below the thresh-", "orig": "If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 552.612, "r_x1": 286.365, "r_y1": 552.612, "r_x2": 286.365, "r_y2": 544.06, "r_x3": 50.112, "r_y3": 544.06, "coord_origin": "TOPLEFT"}, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 564.567, "r_x1": 114.032, "r_y1": 564.567, "r_x2": 114.032, "r_y2": 556.015, "r_x3": 50.112, "r_y3": 556.015, "coord_origin": "TOPLEFT"}, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.732, "r_y0": 576.837, "r_x1": 286.365, "r_y1": 576.837, "r_x2": 286.365, "r_y2": 568.285, "r_x3": 76.732, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 588.792, "r_x1": 286.365, "r_y1": 588.792, "r_x2": 286.365, "r_y2": 580.24, "r_x3": 50.112, "r_y3": 580.24, "coord_origin": "TOPLEFT"}, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 600.7470000000001, "r_x1": 278.704, "r_y1": 600.7470000000001, "r_x2": 278.704, "r_y2": 592.1949999999999, "r_x3": 50.112, "r_y3": 592.1949999999999, "coord_origin": "TOPLEFT"}, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.715, "r_y0": 632.81, "r_x1": 203.496, "r_y1": 632.81, "r_x2": 203.496, "r_y2": 624.104, "r_x3": 160.715, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.585, "r_y0": 640.154, "r_x1": 189.145, "r_y1": 640.154, "r_x2": 189.145, "r_y2": 634.06, "r_x3": 185.585, "r_y3": 634.06, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.499, "r_y0": 632.668, "r_x1": 208.48, "r_y1": 632.668, "r_x2": 208.48, "r_y2": 624.104, "r_x3": 203.499, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.481, "r_y0": 632.81, "r_x1": 216.729, "r_y1": 632.81, "r_x2": 216.729, "r_y2": 624.104, "r_x3": 208.481, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 633.734, "r_x1": 220.289, "r_y1": 633.734, "r_x2": 220.289, "r_y2": 627.64, "r_x3": 216.729, "r_y3": 627.64, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 632.668, "r_x1": 225.768, "r_y1": 632.668, "r_x2": 225.768, "r_y2": 624.104, "r_x3": 220.787, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.705, "r_y0": 654.075, "r_x1": 118.953, "r_y1": 654.075, "r_x2": 118.953, "r_y2": 645.369, "r_x3": 110.705, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.953, "r_y0": 654.998, "r_x1": 122.513, "r_y1": 654.998, "r_x2": 122.513, "r_y2": 648.904, "r_x3": 118.953, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.779, "r_y0": 654.075, "r_x1": 133.528, "r_y1": 654.075, "r_x2": 133.528, "r_y2": 645.369, "r_x3": 125.779, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.295, "r_y0": 654.075, "r_x1": 166.678, "r_y1": 654.075, "r_x2": 166.678, "r_y2": 645.369, "r_x3": 136.295, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "max x", "orig": "max x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.003, "r_y0": 653.933, "r_x1": 160.984, "r_y1": 653.933, "r_x2": 160.984, "r_y2": 645.369, "r_x3": 156.003, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.678, "r_y0": 654.998, "r_x1": 170.238, "r_y1": 654.998, "r_x2": 170.238, "r_y2": 648.904, "r_x3": 166.678, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.736, "r_y0": 653.933, "r_x1": 185.678, "r_y1": 653.933, "r_x2": 185.678, "r_y2": 645.369, "r_x3": 170.736, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "} -", "orig": "} -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.894, "r_y0": 654.075, "r_x1": 216.729, "r_y1": 654.075, "r_x2": 216.729, "r_y2": 645.369, "r_x3": 187.894, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "min x", "orig": "min x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.054, "r_y0": 653.933, "r_x1": 211.035, "r_y1": 653.933, "r_x2": 211.035, "r_y2": 645.369, "r_x3": 206.054, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 654.998, "r_x1": 220.289, "r_y1": 654.998, "r_x2": 220.289, "r_y2": 648.904, "r_x3": 216.729, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 653.933, "r_x1": 225.768, "r_y1": 653.933, "r_x2": 225.768, "r_y2": 645.369, "r_x3": 220.787, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 643.706, "r_x1": 286.362, "r_y1": 643.706, "r_x2": 286.362, "r_y2": 635.154, "r_x3": 274.746, "r_y3": 635.154, "coord_origin": "TOPLEFT"}, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.336, "r_y0": 676.722, "r_x1": 82.648, "r_y1": 676.722, "r_x2": 82.648, "r_y2": 668.016, "r_x3": 78.336, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.533, "r_y0": 676.886, "r_x1": 93.178, "r_y1": 676.886, "r_x2": 93.178, "r_y2": 668.3340000000001, "r_x3": 86.533, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.063, "r_y0": 676.886, "r_x1": 123.634, "r_y1": 676.886, "r_x2": 123.634, "r_y2": 668.3340000000001, "r_x3": 97.063, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "one of", "orig": "one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.519, "r_y0": 676.58, "r_x1": 132.5, "r_y1": 676.58, "r_x2": 132.5, "r_y2": 668.016, "r_x3": 127.519, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.501, "r_y0": 676.886, "r_x1": 148.272, "r_y1": 676.886, "r_x2": 148.272, "r_y2": 668.3340000000001, "r_x3": 132.501, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "left,", "orig": "left,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.506, "r_y0": 676.886, "r_x1": 187.644, "r_y1": 676.886, "r_x2": 187.644, "r_y2": 668.3340000000001, "r_x3": 152.506, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "centroid,", "orig": "centroid,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.878, "r_y0": 676.886, "r_x1": 210.697, "r_y1": 676.886, "r_x2": 210.697, "r_y2": 668.3340000000001, "r_x3": 191.878, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "right", "orig": "right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.697, "r_y0": 676.58, "r_x1": 215.678, "r_y1": 676.58, "r_x2": 215.678, "r_y2": 668.016, "r_x3": 210.697, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.563, "r_y0": 676.886, "r_x1": 233.949, "r_y1": 676.886, "r_x2": 233.949, "r_y2": 668.3340000000001, "r_x3": 219.563, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.835, "r_y0": 676.722, "r_x1": 243.529, "r_y1": 676.722, "r_x2": 243.529, "r_y2": 668.016, "r_x3": 237.835, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.529, "r_y0": 677.645, "r_x1": 247.089, "r_y1": 677.645, "r_x2": 247.089, "r_y2": 671.551, "r_x3": 243.529, "r_y3": 671.551, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.473, "r_y0": 676.886, "r_x1": 258.118, "r_y1": 676.886, "r_x2": 258.118, "r_y2": 668.3340000000001, "r_x3": 251.473, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.003, "r_y0": 676.886, "r_x1": 286.362, "r_y1": 676.886, "r_x2": 286.362, "r_y2": 668.3340000000001, "r_x3": 262.003, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "the x-", "orig": "the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 688.841, "r_x1": 205.887, "r_y1": 688.841, "r_x2": 205.887, "r_y2": 680.289, "r_x3": 50.112, "r_y3": 680.289, "coord_origin": "TOPLEFT"}, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.274, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 76.274, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 94.605, "r_y1": 713.066, "r_x2": 94.605, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.599, "r_y0": 712.902, "r_x1": 103.293, "r_y1": 712.902, "r_x2": 103.293, "r_y2": 704.196, "r_x3": 97.599, "r_y3": 704.196, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.292, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 103.292, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.697, "r_y0": 219.75199999999995, "r_x1": 545.115, "r_y1": 219.75199999999995, "r_x2": 545.115, "r_y2": 211.20000000000005, "r_x3": 440.697, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "The usage of median dur-", "orig": "The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 231.70799999999997, "r_x1": 545.115, "r_y1": 231.70799999999997, "r_x2": 545.115, "r_y2": 223.15599999999995, "r_x3": 308.862, "r_y3": 223.15599999999995, "coord_origin": "TOPLEFT"}, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 243.663, "r_x1": 545.115, "r_y1": 243.663, "r_x2": 545.115, "r_y2": 235.111, "r_x3": 308.862, "r_y3": 235.111, "coord_origin": "TOPLEFT"}, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 255.61800000000005, "r_x1": 339.577, "r_y1": 255.61800000000005, "r_x2": 339.577, "r_y2": 247.06600000000003, "r_x3": 308.862, "r_y3": 247.06600000000003, "coord_origin": "TOPLEFT"}, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.884, "r_y0": 267.923, "r_x1": 545.115, "r_y1": 267.923, "r_x2": 545.115, "r_y2": 259.371, "r_x3": 334.884, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 279.87800000000004, "r_x1": 338.192, "r_y1": 279.87800000000004, "r_x2": 338.192, "r_y2": 271.326, "r_x3": 308.862, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.682, "r_y0": 279.71400000000006, "r_x1": 346.376, "r_y1": 279.71400000000006, "r_x2": 346.376, "r_y2": 271.00800000000004, "r_x3": 340.682, "r_y3": 271.00800000000004, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.376, "r_y0": 279.87800000000004, "r_x1": 453.723, "r_y1": 279.87800000000004, "r_x2": 453.723, "r_y2": 271.326, "r_x3": 346.376, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.144, "r_y0": 292.184, "r_x1": 545.115, "r_y1": 292.184, "r_x2": 545.115, "r_y2": 283.632, "r_x3": 332.144, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.139, "r_x1": 476.562, "r_y1": 304.139, "r_x2": 476.562, "r_y2": 295.587, "r_x3": 308.862, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "corrected bounding boxes and PDF cells.", "orig": "corrected bounding boxes and PDF cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.082, "r_y0": 304.139, "r_x1": 545.115, "r_y1": 304.139, "r_x2": 545.115, "r_y2": 295.587, "r_x3": 482.082, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "This time use a", "orig": "This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.094, "r_x1": 545.115, "r_y1": 316.094, "r_x2": 545.115, "r_y2": 307.542, "r_x3": 308.862, "r_y3": 307.542, "coord_origin": "TOPLEFT"}, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.049, "r_x1": 545.115, "r_y1": 328.049, "r_x2": 545.115, "r_y2": 319.497, "r_x3": 308.862, "r_y3": 319.497, "coord_origin": "TOPLEFT"}, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 340.005, "r_x1": 397.19, "r_y1": 340.005, "r_x2": 397.19, "r_y2": 331.453, "r_x3": 308.862, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.656, "r_y0": 340.005, "r_x1": 545.115, "r_y1": 340.005, "r_x2": 545.115, "r_y2": 331.453, "r_x3": 403.656, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 351.96, "r_x1": 545.115, "r_y1": 351.96, "r_x2": 545.115, "r_y2": 343.408, "r_x3": 308.862, "r_y3": 343.408, "coord_origin": "TOPLEFT"}, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 363.915, "r_x1": 357.26, "r_y1": 363.915, "r_x2": 357.26, "r_y2": 355.363, "r_x3": 308.862, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "is preferred.", "orig": "is preferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.176, "r_y0": 363.915, "r_x1": 545.115, "r_y1": 363.915, "r_x2": 545.115, "r_y2": 355.363, "r_x3": 361.176, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "This covers the cases where the PDF cells are", "orig": "This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 375.87, "r_x1": 545.115, "r_y1": 375.87, "r_x2": 545.115, "r_y2": 367.318, "r_x3": 308.862, "r_y3": 367.318, "coord_origin": "TOPLEFT"}, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 387.825, "r_x1": 329.614, "r_y1": 387.825, "r_x2": 329.614, "r_y2": 379.273, "r_x3": 308.862, "r_y3": 379.273, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.569, "r_y0": 400.131, "r_x1": 545.115, "r_y1": 400.131, "r_x2": 545.115, "r_y2": 391.579, "r_x3": 333.569, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.086, "r_x1": 545.115, "r_y1": 412.086, "r_x2": 545.115, "r_y2": 403.534, "r_x3": 308.862, "r_y3": 403.534, "coord_origin": "TOPLEFT"}, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.041, "r_x1": 545.115, "r_y1": 424.041, "r_x2": 545.115, "r_y2": 415.489, "r_x3": 308.862, "r_y3": 415.489, "coord_origin": "TOPLEFT"}, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.996, "r_x1": 488.109, "r_y1": 435.996, "r_x2": 488.109, "r_y2": 427.444, "r_x3": 308.862, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "columns pointing to the same PDF column.", "orig": "columns pointing to the same PDF column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.336, "r_y0": 435.996, "r_x1": 545.115, "r_y1": 435.996, "r_x2": 545.115, "r_y2": 427.444, "r_x3": 494.336, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "In such case", "orig": "In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.951, "r_x1": 545.115, "r_y1": 447.951, "r_x2": 545.115, "r_y2": 439.399, "r_x3": 308.862, "r_y3": 439.399, "coord_origin": "TOPLEFT"}, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.906, "r_x1": 426.182, "r_y1": 459.906, "r_x2": 426.182, "r_y2": 451.354, "r_x3": 308.862, "r_y3": 451.354, "coord_origin": "TOPLEFT"}, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.629, "r_y0": 472.212, "r_x1": 478.505, "r_y1": 472.212, "r_x2": 478.505, "r_y2": 463.66, "r_x3": 333.629, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "Pick up the remaining orphan cells.", "orig": "Pick up the remaining orphan cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.855, "r_y0": 472.212, "r_x1": 545.115, "r_y1": 472.212, "r_x2": 545.115, "r_y2": 463.66, "r_x3": 483.855, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "There could be", "orig": "There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.167, "r_x1": 545.115, "r_y1": 484.167, "r_x2": 545.115, "r_y2": 475.615, "r_x3": 308.862, "r_y3": 475.615, "coord_origin": "TOPLEFT"}, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.122, "r_x1": 545.115, "r_y1": 496.122, "r_x2": 545.115, "r_y2": 487.57, "r_x3": 308.862, "r_y3": 487.57, "coord_origin": "TOPLEFT"}, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.077, "r_x1": 381.898, "r_y1": 508.077, "r_x2": 381.898, "r_y2": 499.525, "r_x3": 308.862, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.702, "r_y0": 508.077, "r_x1": 545.115, "r_y1": 508.077, "r_x2": 545.115, "r_y2": 499.525, "r_x3": 388.702, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.033, "r_x1": 545.115, "r_y1": 520.033, "r_x2": 545.115, "r_y2": 511.481, "r_x3": 308.862, "r_y3": 511.481, "coord_origin": "TOPLEFT"}, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.988, "r_x1": 483.576, "r_y1": 531.988, "r_x2": 483.576, "r_y2": 523.4359999999999, "r_x3": 308.862, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box on the geometry of the grid.", "orig": "bounding box on the geometry of the grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.195, "r_y0": 531.988, "r_x1": 545.115, "r_y1": 531.988, "r_x2": 545.115, "r_y2": 523.4359999999999, "r_x3": 489.195, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "This mapping", "orig": "This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.943, "r_x1": 545.115, "r_y1": 543.943, "r_x2": 545.115, "r_y2": 535.3910000000001, "r_x3": 308.862, "r_y3": 535.3910000000001, "coord_origin": "TOPLEFT"}, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.898, "r_x1": 545.115, "r_y1": 555.898, "r_x2": 545.115, "r_y2": 547.346, "r_x3": 308.862, "r_y3": 547.346, "coord_origin": "TOPLEFT"}, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.8530000000001, "r_x1": 442.221, "r_y1": 567.8530000000001, "r_x2": 442.221, "r_y2": 559.3009999999999, "r_x3": 308.862, "r_y3": 559.3009999999999, "coord_origin": "TOPLEFT"}, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.943, "r_y0": 580.159, "r_x1": 545.115, "r_y1": 580.159, "r_x2": 545.115, "r_y2": 571.607, "r_x3": 337.943, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "Compute the top and bottom boundary of the hori-", "orig": "Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 592.114, "r_x1": 471.641, "r_y1": 592.114, "r_x2": 471.641, "r_y2": 583.562, "r_x3": 308.862, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.834, "r_y0": 591.95, "r_x1": 479.719, "r_y1": 591.95, "r_x2": 479.719, "r_y2": 583.244, "r_x3": 474.834, "r_y3": 583.244, "coord_origin": "TOPLEFT"}, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.269, "r_y0": 592.114, "r_x1": 545.117, "r_y1": 592.114, "r_x2": 545.117, "r_y2": 583.562, "r_x3": 483.269, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 604.069, "r_x1": 329.913, "r_y1": 604.069, "r_x2": 329.913, "r_y2": 595.517, "r_x3": 308.862, "r_y3": 595.517, "coord_origin": "TOPLEFT"}, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.925, "r_y0": 616.374, "r_x1": 374.226, "r_y1": 616.374, "r_x2": 374.226, "r_y2": 607.822, "r_x3": 339.925, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "Intersect", "orig": "Intersect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.042, "r_y0": 616.374, "r_x1": 545.115, "r_y1": 616.374, "r_x2": 545.115, "r_y2": 607.822, "r_x3": 378.042, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "the orphan's bounding box with the row", "orig": "the orphan's bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 628.33, "r_x1": 495.292, "r_y1": 628.33, "r_x2": 495.292, "r_y2": 619.778, "r_x3": 308.862, "r_y3": 619.778, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.534, "r_y0": 640.635, "r_x1": 545.115, "r_y1": 640.635, "r_x2": 545.115, "r_y2": 632.083, "r_x3": 337.534, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "Compute the left and right boundary of the vertical", "orig": "Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.59, "r_x1": 455.282, "r_y1": 652.59, "r_x2": 455.282, "r_y2": 644.038, "r_x3": 308.862, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.777, "r_y0": 652.4259999999999, "r_x1": 463.471, "r_y1": 652.4259999999999, "r_x2": 463.471, "r_y2": 643.72, "r_x3": 457.777, "r_y3": 643.72, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.971, "r_y0": 652.59, "r_x1": 545.114, "r_y1": 652.59, "r_x2": 545.114, "r_y2": 644.038, "r_x3": 465.971, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.545, "r_x1": 332.384, "r_y1": 664.545, "r_x2": 332.384, "r_y2": 655.9929999999999, "r_x3": 308.862, "r_y3": 655.9929999999999, "coord_origin": "TOPLEFT"}, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 688.806, "r_x1": 510.585, "r_y1": 688.806, "r_x2": 510.585, "r_y2": 680.254, "r_x3": 308.862, "r_y3": 680.254, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 1, "label": "caption", "bbox": {"l": 50.112, "t": 165.77099999999996, "r": 86.585, "b": 174.32299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9661495685577393, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 61.569, "t": 211.20000000000005, "r": 65.056, "b": 219.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9621952772140503, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 308.862, "t": 211.20000000000005, "r": 435.915, "b": 219.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8942298889160156, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 61.569, "t": 244.34000000000003, "r": 65.056, "b": 252.89200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9629555344581604, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 320.817, "t": 259.371, "r": 328.289, "b": 267.923, "coord_origin": "TOPLEFT"}, "confidence": 0.9423392415046692, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 279.472, "r": 286.365, "b": 288.024, "coord_origin": "TOPLEFT"}, "confidence": 0.9767085909843445, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 320.817, "t": 283.632, "r": 328.289, "b": 292.184, "coord_origin": "TOPLEFT"}, "confidence": 0.9562004804611206, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "list_item", "bbox": {"l": 320.817, "t": 391.579, "r": 328.289, "b": 400.131, "coord_origin": "TOPLEFT"}, "confidence": 0.8719939589500427, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 399.338, "r": 286.365, "b": 407.89, "coord_origin": "TOPLEFT"}, "confidence": 0.934766411781311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "list_item", "bbox": {"l": 62.067, "t": 423.564, "r": 286.365, "b": 432.116, "coord_origin": "TOPLEFT"}, "confidence": 0.8280702233314514, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 62.067, "t": 459.744, "r": 69.539, "b": 468.296, "coord_origin": "TOPLEFT"}, "confidence": 0.9646760821342468, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "list_item", "bbox": {"l": 320.817, "t": 463.66, "r": 328.289, "b": 472.212, "coord_origin": "TOPLEFT"}, "confidence": 0.9126082062721252, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 62.067, "t": 507.879, "r": 69.539, "b": 516.431, "coord_origin": "TOPLEFT"}, "confidence": 0.9391399025917053, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 62.067, "t": 532.104, "r": 76.453, "b": 540.656, "coord_origin": "TOPLEFT"}, "confidence": 0.9491708874702454, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 62.067, "t": 568.285, "r": 69.539, "b": 576.837, "coord_origin": "TOPLEFT"}, "confidence": 0.9587163329124451, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 320.817, "t": 571.607, "r": 332.712, "b": 580.159, "coord_origin": "TOPLEFT"}, "confidence": 0.8459473848342896, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "list_item", "bbox": {"l": 320.817, "t": 607.822, "r": 332.872, "b": 616.374, "coord_origin": "TOPLEFT"}, "confidence": 0.7716891169548035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "formula", "bbox": {"l": 112.028, "t": 624.104, "r": 157.952, "b": 632.81, "coord_origin": "TOPLEFT"}, "confidence": 0.9298412799835205, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 320.817, "t": 632.083, "r": 332.712, "b": 640.635, "coord_origin": "TOPLEFT"}, "confidence": 0.8584907054901123, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "list_item", "bbox": {"l": 320.817, "t": 668.299, "r": 545.115, "b": 676.851, "coord_origin": "TOPLEFT"}, "confidence": 0.7590745091438293, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 668.3340000000001, "r": 74.451, "b": 676.886, "coord_origin": "TOPLEFT"}, "confidence": 0.9545555114746094, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "list_item", "bbox": {"l": 62.067, "t": 692.559, "r": 69.539, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.9260510206222534, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "list_item", "bbox": {"l": 320.817, "t": 692.559, "r": 545.115, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.6971189975738525, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9126598238945007, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "picture", "bbox": {"l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT"}, "confidence": 0.6033818125724792, "cells": [], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 1, "page_no": 11, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 50.112, "t": 165.77099999999996, "r": 86.585, "b": 174.32299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9661495685577393, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7:"}, {"label": "list_item", "id": 4, "page_no": 11, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 61.569, "t": 211.20000000000005, "r": 65.056, "b": 219.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9621952772140503, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "text", "id": 16, "page_no": 11, "cluster": {"id": 16, "label": "text", "bbox": {"l": 308.862, "t": 211.20000000000005, "r": 435.915, "b": 219.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8942298889160156, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "dian cell size for all table cells."}, {"label": "list_item", "id": 3, "page_no": 11, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 61.569, "t": 244.34000000000003, "r": 65.056, "b": 252.89200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9629555344581604, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "list_item", "id": 9, "page_no": 11, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 320.817, "t": 259.371, "r": 328.289, "b": 267.923, "coord_origin": "TOPLEFT"}, "confidence": 0.9423392415046692, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6."}, {"label": "text", "id": 0, "page_no": 11, "cluster": {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 279.472, "r": 286.365, "b": 288.024, "coord_origin": "TOPLEFT"}, "confidence": 0.9767085909843445, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "However, it is possible to mitigate those limitations by"}, {"label": "list_item", "id": 6, "page_no": 11, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 320.817, "t": 283.632, "r": 328.289, "b": 292.184, "coord_origin": "TOPLEFT"}, "confidence": 0.9562004804611206, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7."}, {"label": "list_item", "id": 17, "page_no": 11, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 320.817, "t": 391.579, "r": 328.289, "b": 400.131, "coord_origin": "TOPLEFT"}, "confidence": 0.8719939589500427, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8."}, {"label": "text", "id": 11, "page_no": 11, "cluster": {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 399.338, "r": 286.365, "b": 407.89, "coord_origin": "TOPLEFT"}, "confidence": 0.934766411781311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Here is a step-by-step description of the prediction post-"}, {"label": "list_item", "id": 20, "page_no": 11, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 62.067, "t": 423.564, "r": 286.365, "b": 432.116, "coord_origin": "TOPLEFT"}, "confidence": 0.8280702233314514, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Get the minimal grid dimensions - number of rows and"}, {"label": "list_item", "id": 2, "page_no": 11, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 62.067, "t": 459.744, "r": 69.539, "b": 468.296, "coord_origin": "TOPLEFT"}, "confidence": 0.9646760821342468, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2."}, {"label": "list_item", "id": 15, "page_no": 11, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 320.817, "t": 463.66, "r": 328.289, "b": 472.212, "coord_origin": "TOPLEFT"}, "confidence": 0.9126082062721252, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9."}, {"label": "list_item", "id": 10, "page_no": 11, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 62.067, "t": 507.879, "r": 69.539, "b": 516.431, "coord_origin": "TOPLEFT"}, "confidence": 0.9391399025917053, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3."}, {"label": "list_item", "id": 8, "page_no": 11, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 62.067, "t": 532.104, "r": 76.453, "b": 540.656, "coord_origin": "TOPLEFT"}, "confidence": 0.9491708874702454, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3.a."}, {"label": "list_item", "id": 5, "page_no": 11, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 62.067, "t": 568.285, "r": 69.539, "b": 576.837, "coord_origin": "TOPLEFT"}, "confidence": 0.9587163329124451, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4."}, {"label": "text", "id": 19, "page_no": 11, "cluster": {"id": 19, "label": "text", "bbox": {"l": 320.817, "t": 571.607, "r": 332.712, "b": 580.159, "coord_origin": "TOPLEFT"}, "confidence": 0.8459473848342896, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9a."}, {"label": "list_item", "id": 21, "page_no": 11, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 320.817, "t": 607.822, "r": 332.872, "b": 616.374, "coord_origin": "TOPLEFT"}, "confidence": 0.7716891169548035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9b."}, {"label": "formula", "id": 12, "page_no": 11, "cluster": {"id": 12, "label": "formula", "bbox": {"l": 112.028, "t": 624.104, "r": 157.952, "b": 632.81, "coord_origin": "TOPLEFT"}, "confidence": 0.9298412799835205, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "alignment"}, {"label": "list_item", "id": 18, "page_no": 11, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 320.817, "t": 632.083, "r": 332.712, "b": 640.635, "coord_origin": "TOPLEFT"}, "confidence": 0.8584907054901123, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9c."}, {"label": "list_item", "id": 22, "page_no": 11, "cluster": {"id": 22, "label": "list_item", "bbox": {"l": 320.817, "t": 668.299, "r": 545.115, "b": 676.851, "coord_origin": "TOPLEFT"}, "confidence": 0.7590745091438293, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9d. Intersect the orphan's bounding box with the column"}, {"label": "text", "id": 7, "page_no": 11, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 668.3340000000001, "r": 74.451, "b": 676.886, "coord_origin": "TOPLEFT"}, "confidence": 0.9545555114746094, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where"}, {"label": "list_item", "id": 13, "page_no": 11, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 62.067, "t": 692.559, "r": 69.539, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.9260510206222534, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5."}, {"label": "list_item", "id": 25, "page_no": 11, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 320.817, "t": 692.559, "r": 545.115, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.6971189975738525, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9e. If the table cell under the identified row and column"}, {"label": "page_footer", "id": 14, "page_no": 11, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9126598238945007, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12"}, {"label": "picture", "id": 30, "page_no": 11, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT"}, "confidence": 0.6033818125724792, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 1, "page_no": 11, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 50.112, "t": 165.77099999999996, "r": 86.585, "b": 174.32299999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9661495685577393, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7:"}, {"label": "list_item", "id": 4, "page_no": 11, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 61.569, "t": 211.20000000000005, "r": 65.056, "b": 219.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9621952772140503, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "text", "id": 16, "page_no": 11, "cluster": {"id": 16, "label": "text", "bbox": {"l": 308.862, "t": 211.20000000000005, "r": 435.915, "b": 219.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8942298889160156, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "dian cell size for all table cells."}, {"label": "list_item", "id": 3, "page_no": 11, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 61.569, "t": 244.34000000000003, "r": 65.056, "b": 252.89200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9629555344581604, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2022"}, {"label": "list_item", "id": 9, "page_no": 11, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 320.817, "t": 259.371, "r": 328.289, "b": 267.923, "coord_origin": "TOPLEFT"}, "confidence": 0.9423392415046692, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6."}, {"label": "text", "id": 0, "page_no": 11, "cluster": {"id": 0, "label": "text", "bbox": {"l": 62.067, "t": 279.472, "r": 286.365, "b": 288.024, "coord_origin": "TOPLEFT"}, "confidence": 0.9767085909843445, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "However, it is possible to mitigate those limitations by"}, {"label": "list_item", "id": 6, "page_no": 11, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 320.817, "t": 283.632, "r": 328.289, "b": 292.184, "coord_origin": "TOPLEFT"}, "confidence": 0.9562004804611206, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7."}, {"label": "list_item", "id": 17, "page_no": 11, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 320.817, "t": 391.579, "r": 328.289, "b": 400.131, "coord_origin": "TOPLEFT"}, "confidence": 0.8719939589500427, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8."}, {"label": "text", "id": 11, "page_no": 11, "cluster": {"id": 11, "label": "text", "bbox": {"l": 62.067, "t": 399.338, "r": 286.365, "b": 407.89, "coord_origin": "TOPLEFT"}, "confidence": 0.934766411781311, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Here is a step-by-step description of the prediction post-"}, {"label": "list_item", "id": 20, "page_no": 11, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 62.067, "t": 423.564, "r": 286.365, "b": 432.116, "coord_origin": "TOPLEFT"}, "confidence": 0.8280702233314514, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Get the minimal grid dimensions - number of rows and"}, {"label": "list_item", "id": 2, "page_no": 11, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 62.067, "t": 459.744, "r": 69.539, "b": 468.296, "coord_origin": "TOPLEFT"}, "confidence": 0.9646760821342468, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2."}, {"label": "list_item", "id": 15, "page_no": 11, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 320.817, "t": 463.66, "r": 328.289, "b": 472.212, "coord_origin": "TOPLEFT"}, "confidence": 0.9126082062721252, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9."}, {"label": "list_item", "id": 10, "page_no": 11, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 62.067, "t": 507.879, "r": 69.539, "b": 516.431, "coord_origin": "TOPLEFT"}, "confidence": 0.9391399025917053, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3."}, {"label": "list_item", "id": 8, "page_no": 11, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 62.067, "t": 532.104, "r": 76.453, "b": 540.656, "coord_origin": "TOPLEFT"}, "confidence": 0.9491708874702454, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3.a."}, {"label": "list_item", "id": 5, "page_no": 11, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 62.067, "t": 568.285, "r": 69.539, "b": 576.837, "coord_origin": "TOPLEFT"}, "confidence": 0.9587163329124451, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4."}, {"label": "text", "id": 19, "page_no": 11, "cluster": {"id": 19, "label": "text", "bbox": {"l": 320.817, "t": 571.607, "r": 332.712, "b": 580.159, "coord_origin": "TOPLEFT"}, "confidence": 0.8459473848342896, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9a."}, {"label": "list_item", "id": 21, "page_no": 11, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 320.817, "t": 607.822, "r": 332.872, "b": 616.374, "coord_origin": "TOPLEFT"}, "confidence": 0.7716891169548035, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9b."}, {"label": "formula", "id": 12, "page_no": 11, "cluster": {"id": 12, "label": "formula", "bbox": {"l": 112.028, "t": 624.104, "r": 157.952, "b": 632.81, "coord_origin": "TOPLEFT"}, "confidence": 0.9298412799835205, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "alignment"}, {"label": "list_item", "id": 18, "page_no": 11, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 320.817, "t": 632.083, "r": 332.712, "b": 640.635, "coord_origin": "TOPLEFT"}, "confidence": 0.8584907054901123, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9c."}, {"label": "list_item", "id": 22, "page_no": 11, "cluster": {"id": 22, "label": "list_item", "bbox": {"l": 320.817, "t": 668.299, "r": 545.115, "b": 676.851, "coord_origin": "TOPLEFT"}, "confidence": 0.7590745091438293, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9d. Intersect the orphan's bounding box with the column"}, {"label": "text", "id": 7, "page_no": 11, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 668.3340000000001, "r": 74.451, "b": 676.886, "coord_origin": "TOPLEFT"}, "confidence": 0.9545555114746094, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where"}, {"label": "list_item", "id": 13, "page_no": 11, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 62.067, "t": 692.559, "r": 69.539, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.9260510206222534, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5."}, {"label": "list_item", "id": 25, "page_no": 11, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 320.817, "t": 692.559, "r": 545.115, "b": 701.111, "coord_origin": "TOPLEFT"}, "confidence": 0.6971189975738525, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9e. If the table cell under the identified row and column"}, {"label": "picture", "id": 30, "page_no": 11, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT"}, "confidence": 0.6033818125724792, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 14, "page_no": 11, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9126598238945007, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12"}]}}, {"page_no": 12, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.316, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 78.316, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Otherwise create a new structural cell and match it", "orig": "Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 127.033, "r_y1": 107.93899999999996, "r_x2": 127.033, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.70600000000002, "r_x1": 234.061, "r_y1": 131.70600000000002, "r_x2": 234.061, "r_y2": 123.11800000000005, "r_x3": 50.112, "r_y3": 123.11800000000005, "coord_origin": "TOPLEFT"}, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.174, "r_y0": 510.877, "r_x1": 273.133, "r_y1": 510.877, "r_x2": 273.133, "r_y2": 502.325, "r_x3": 105.174, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Example of a table with multi-line header.", "orig": "Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.787, "r_y0": 315.419, "r_x1": 545.115, "r_y1": 315.419, "r_x2": 545.115, "r_y2": 306.867, "r_x3": 352.787, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 327.374, "r_x1": 355.895, "r_y1": 327.374, "r_x2": 355.895, "r_y2": 318.822, "r_x3": 308.862, "r_y3": 318.822, "coord_origin": "TOPLEFT"}, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.157, "r_y0": 689.314, "r_x1": 541.632, "r_y1": 689.314, "r_x2": 541.632, "r_y2": 680.762, "r_x3": 359.157, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Example of a complex table with empty cells.", "orig": "Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 88.847, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.7545598149299622, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 87.43200000000002, "r": 72.856, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9170762300491333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 111.16300000000001, "r": 286.365, "b": 119.75099999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9454683065414429, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 306.867, "r": 345.634, "b": 315.419, "coord_origin": "TOPLEFT"}, "confidence": 0.8773345351219177, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "caption", "bbox": {"l": 63.341, "t": 502.325, "r": 99.595, "b": 510.877, "coord_origin": "TOPLEFT"}, "confidence": 0.8971090316772461, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "caption", "bbox": {"l": 312.343, "t": 680.762, "r": 353.578, "b": 689.314, "coord_origin": "TOPLEFT"}, "confidence": 0.9188510179519653, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9020507335662842, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, {"id": 19, "label": "picture", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.6956620812416077, "cells": [], "children": []}, {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, {"id": 13, "label": "picture", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.8023569583892822, "cells": [], "children": []}, {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"17": {"label": "table", "id": 17, "page_no": 12, "cluster": {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "32": {"label": "table", "id": 32, "page_no": 12, "cluster": {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "9": {"label": "table", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "21": {"label": "table", "id": 21, "page_no": 12, "cluster": {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "4": {"label": "table", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "37": {"label": "table", "id": 37, "page_no": 12, "cluster": {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "6": {"label": "table", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "12": {"label": "table", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "0": {"label": "table", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "10": {"label": "table", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "5": {"label": "table", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "30": {"label": "table", "id": 30, "page_no": 12, "cluster": {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 14, "page_no": 12, "cluster": {"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 88.847, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.7545598149299622, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "phan cell."}, {"label": "text", "id": 3, "page_no": 12, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 87.43200000000002, "r": 72.856, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9170762300491333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9f."}, {"label": "text", "id": 1, "page_no": 12, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 111.16300000000001, "r": 286.365, "b": 119.75099999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9454683065414429, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aditional images with examples of TableFormer predic-"}, {"label": "caption", "id": 11, "page_no": 12, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 306.867, "r": 345.634, "b": 315.419, "coord_origin": "TOPLEFT"}, "confidence": 0.8773345351219177, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 9:"}, {"label": "caption", "id": 8, "page_no": 12, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 63.341, "t": 502.325, "r": 99.595, "b": 510.877, "coord_origin": "TOPLEFT"}, "confidence": 0.8971090316772461, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 8:"}, {"label": "caption", "id": 2, "page_no": 12, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 312.343, "t": 680.762, "r": 353.578, "b": 689.314, "coord_origin": "TOPLEFT"}, "confidence": 0.9188510179519653, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 10:"}, {"label": "page_footer", "id": 7, "page_no": 12, "cluster": {"id": 7, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9020507335662842, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13"}, {"label": "table", "id": 17, "page_no": 12, "cluster": {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 32, "page_no": 12, "cluster": {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 21, "page_no": 12, "cluster": {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 19, "page_no": 12, "cluster": {"id": 19, "label": "picture", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.6956620812416077, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 37, "page_no": 12, "cluster": {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 13, "page_no": 12, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.8023569583892822, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 30, "page_no": 12, "cluster": {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "text", "id": 14, "page_no": 12, "cluster": {"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 88.847, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.7545598149299622, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "phan cell."}, {"label": "text", "id": 3, "page_no": 12, "cluster": {"id": 3, "label": "text", "bbox": {"l": 62.067, "t": 87.43200000000002, "r": 72.856, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9170762300491333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9f."}, {"label": "text", "id": 1, "page_no": 12, "cluster": {"id": 1, "label": "text", "bbox": {"l": 62.067, "t": 111.16300000000001, "r": 286.365, "b": 119.75099999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9454683065414429, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aditional images with examples of TableFormer predic-"}, {"label": "caption", "id": 11, "page_no": 12, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 306.867, "r": 345.634, "b": 315.419, "coord_origin": "TOPLEFT"}, "confidence": 0.8773345351219177, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 9:"}, {"label": "caption", "id": 8, "page_no": 12, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 63.341, "t": 502.325, "r": 99.595, "b": 510.877, "coord_origin": "TOPLEFT"}, "confidence": 0.8971090316772461, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 8:"}, {"label": "caption", "id": 2, "page_no": 12, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 312.343, "t": 680.762, "r": 353.578, "b": 689.314, "coord_origin": "TOPLEFT"}, "confidence": 0.9188510179519653, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 10:"}, {"label": "table", "id": 17, "page_no": 12, "cluster": {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 32, "page_no": 12, "cluster": {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 21, "page_no": 12, "cluster": {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 19, "page_no": 12, "cluster": {"id": 19, "label": "picture", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.6956620812416077, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 37, "page_no": 12, "cluster": {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 13, "page_no": 12, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.8023569583892822, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 30, "page_no": 12, "cluster": {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_footer", "id": 7, "page_no": 12, "cluster": {"id": 7, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9020507335662842, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13"}]}}, {"page_no": 13, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.731, "r_y0": 365.591, "r_x1": 215.67, "r_y1": 365.591, "r_x2": 215.67, "r_y2": 357.039, "r_x3": 103.731, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Simple table with different", "orig": "Simple table with different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.865, "r_y0": 365.591, "r_x1": 238.684, "r_y1": 365.591, "r_x2": 238.684, "r_y2": 357.039, "r_x3": 219.865, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.878, "r_y0": 365.591, "r_x1": 286.365, "r_y1": 365.591, "r_x2": 286.365, "r_y2": 357.039, "r_x3": 242.878, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "and empty", "orig": "and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 377.546, "r_x1": 70.864, "r_y1": 377.546, "r_x2": 70.864, "r_y2": 368.994, "r_x3": 50.112, "r_y3": 368.994, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.433, "r_y0": 680.639, "r_x1": 281.856, "r_y1": 680.639, "r_x2": 281.856, "r_y2": 672.087, "r_x3": 101.433, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Simple table predictions and post processing.", "orig": "Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.604, "r_y0": 380.505, "r_x1": 538.185, "r_y1": 380.505, "r_x2": 538.185, "r_y2": 371.953, "r_x3": 362.604, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Table predictions example on colorful table.", "orig": "Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.799, "r_y0": 692.367, "r_x1": 508.989, "r_y1": 692.367, "r_x2": 508.989, "r_y2": 683.815, "r_x3": 391.799, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Example with multi-line text.", "orig": "Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 357.039, "r": 93.051, "b": 365.591, "coord_origin": "TOPLEFT"}, "confidence": 0.951069176197052, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "caption", "bbox": {"l": 315.79, "t": 371.953, "r": 357.025, "b": 380.505, "coord_origin": "TOPLEFT"}, "confidence": 0.9178510904312134, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "caption", "bbox": {"l": 54.619, "t": 672.087, "r": 95.854, "b": 680.639, "coord_origin": "TOPLEFT"}, "confidence": 0.926384687423706, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "caption", "bbox": {"l": 344.985, "t": 683.815, "r": 386.22, "b": 692.367, "coord_origin": "TOPLEFT"}, "confidence": 0.9191023111343384, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.887715220451355, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "picture", "bbox": {"l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT"}, "confidence": 0.5003598928451538, "cells": [], "children": []}, {"id": 30, "label": "picture", "bbox": {"l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT"}, "confidence": 0.5613773465156555, "cells": [], "children": []}, {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, {"id": 11, "label": "picture", "bbox": {"l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT"}, "confidence": 0.7871124744415283, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"23": {"label": "table", "id": 23, "page_no": 13, "cluster": {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "33": {"label": "table", "id": 33, "page_no": 13, "cluster": {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "27": {"label": "table", "id": 27, "page_no": 13, "cluster": {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "38": {"label": "table", "id": 38, "page_no": 13, "cluster": {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "10": {"label": "table", "id": 10, "page_no": 13, "cluster": {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "9": {"label": "table", "id": 9, "page_no": 13, "cluster": {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "8": {"label": "table", "id": 8, "page_no": 13, "cluster": {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "4": {"label": "table", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "15": {"label": "table", "id": 15, "page_no": 13, "cluster": {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "6": {"label": "table", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "7": {"label": "table", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 0, "page_no": 13, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 357.039, "r": 93.051, "b": 365.591, "coord_origin": "TOPLEFT"}, "confidence": 0.951069176197052, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 11:"}, {"label": "caption", "id": 3, "page_no": 13, "cluster": {"id": 3, "label": "caption", "bbox": {"l": 315.79, "t": 371.953, "r": 357.025, "b": 380.505, "coord_origin": "TOPLEFT"}, "confidence": 0.9178510904312134, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 13:"}, {"label": "caption", "id": 1, "page_no": 13, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 54.619, "t": 672.087, "r": 95.854, "b": 680.639, "coord_origin": "TOPLEFT"}, "confidence": 0.926384687423706, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 12:"}, {"label": "caption", "id": 2, "page_no": 13, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 344.985, "t": 683.815, "r": 386.22, "b": 692.367, "coord_origin": "TOPLEFT"}, "confidence": 0.9191023111343384, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 14:"}, {"label": "page_footer", "id": 5, "page_no": 13, "cluster": {"id": 5, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.887715220451355, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14"}, {"label": "picture", "id": 41, "page_no": 13, "cluster": {"id": 41, "label": "picture", "bbox": {"l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT"}, "confidence": 0.5003598928451538, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 30, "page_no": 13, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT"}, "confidence": 0.5613773465156555, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 23, "page_no": 13, "cluster": {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 33, "page_no": 13, "cluster": {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 27, "page_no": 13, "cluster": {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 38, "page_no": 13, "cluster": {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 13, "cluster": {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 13, "cluster": {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 8, "page_no": 13, "cluster": {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 15, "page_no": 13, "cluster": {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 11, "page_no": 13, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT"}, "confidence": 0.7871124744415283, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 0, "page_no": 13, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 357.039, "r": 93.051, "b": 365.591, "coord_origin": "TOPLEFT"}, "confidence": 0.951069176197052, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 11:"}, {"label": "caption", "id": 3, "page_no": 13, "cluster": {"id": 3, "label": "caption", "bbox": {"l": 315.79, "t": 371.953, "r": 357.025, "b": 380.505, "coord_origin": "TOPLEFT"}, "confidence": 0.9178510904312134, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 13:"}, {"label": "caption", "id": 1, "page_no": 13, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 54.619, "t": 672.087, "r": 95.854, "b": 680.639, "coord_origin": "TOPLEFT"}, "confidence": 0.926384687423706, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 12:"}, {"label": "caption", "id": 2, "page_no": 13, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 344.985, "t": 683.815, "r": 386.22, "b": 692.367, "coord_origin": "TOPLEFT"}, "confidence": 0.9191023111343384, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 14:"}, {"label": "picture", "id": 41, "page_no": 13, "cluster": {"id": 41, "label": "picture", "bbox": {"l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT"}, "confidence": 0.5003598928451538, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 30, "page_no": 13, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT"}, "confidence": 0.5613773465156555, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 23, "page_no": 13, "cluster": {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 33, "page_no": 13, "cluster": {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 27, "page_no": 13, "cluster": {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 38, "page_no": 13, "cluster": {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 13, "cluster": {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 13, "cluster": {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 8, "page_no": 13, "cluster": {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 15, "page_no": 13, "cluster": {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 11, "page_no": 13, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT"}, "confidence": 0.7871124744415283, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 5, "page_no": 13, "cluster": {"id": 5, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.887715220451355, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14"}]}}, {"page_no": 14, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.047, "r_y0": 653.172, "r_x1": 252.242, "r_y1": 653.172, "r_x2": 252.242, "r_y2": 644.62, "r_x3": 131.047, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Example with triangular table.", "orig": "Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.341, "r_y0": 661.756, "r_x1": 545.115, "r_y1": 661.756, "r_x2": 545.115, "r_y2": 653.204, "r_x3": 354.341, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Example of how post-processing helps to restore", "orig": "Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 673.711, "r_x1": 497.603, "r_y1": 673.711, "r_x2": 497.603, "r_y2": 665.159, "r_x3": 308.862, "r_y3": 665.159, "coord_origin": "TOPLEFT"}, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 0, "label": "caption", "bbox": {"l": 84.233, "t": 644.62, "r": 125.468, "b": 653.172, "coord_origin": "TOPLEFT"}, "confidence": 0.9257225394248962, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "caption", "bbox": {"l": 308.862, "t": 653.204, "r": 349.559, "b": 661.756, "coord_origin": "TOPLEFT"}, "confidence": 0.9134758710861206, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9037020802497864, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, {"id": 6, "label": "picture", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.8099280595779419, "cells": [], "children": []}, {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, {"id": 18, "label": "picture", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.567050039768219, "cells": [], "children": []}, {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, {"id": 20, "label": "picture", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.5515198707580566, "cells": [], "children": []}, {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, {"id": 5, "label": "picture", "bbox": {"l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT"}, "confidence": 0.8410326838493347, "cells": [], "children": []}, {"id": 22, "label": "picture", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.5478786826133728, "cells": [], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, {"id": 7, "label": "picture", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.8057592511177063, "cells": [], "children": []}, {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"4": {"label": "table", "id": 4, "page_no": 14, "cluster": {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "19": {"label": "table", "id": 19, "page_no": 14, "cluster": {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "2": {"label": "table", "id": 2, "page_no": 14, "cluster": {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "10": {"label": "table", "id": 10, "page_no": 14, "cluster": {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "9": {"label": "table", "id": 9, "page_no": 14, "cluster": {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "8": {"label": "table", "id": 8, "page_no": 14, "cluster": {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "11": {"label": "table", "id": 11, "page_no": 14, "cluster": {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 0, "page_no": 14, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 84.233, "t": 644.62, "r": 125.468, "b": 653.172, "coord_origin": "TOPLEFT"}, "confidence": 0.9257225394248962, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 15:"}, {"label": "caption", "id": 1, "page_no": 14, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 308.862, "t": 653.204, "r": 349.559, "b": 661.756, "coord_origin": "TOPLEFT"}, "confidence": 0.9134758710861206, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 16:"}, {"label": "page_footer", "id": 3, "page_no": 14, "cluster": {"id": 3, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9037020802497864, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "15"}, {"label": "table", "id": 4, "page_no": 14, "cluster": {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 6, "page_no": 14, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.8099280595779419, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 19, "page_no": 14, "cluster": {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 2, "page_no": 14, "cluster": {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 18, "page_no": 14, "cluster": {"id": 18, "label": "picture", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.567050039768219, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 10, "page_no": 14, "cluster": {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 20, "page_no": 14, "cluster": {"id": 20, "label": "picture", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.5515198707580566, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 9, "page_no": 14, "cluster": {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 5, "page_no": 14, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT"}, "confidence": 0.8410326838493347, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 22, "page_no": 14, "cluster": {"id": 22, "label": "picture", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.5478786826133728, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 8, "page_no": 14, "cluster": {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 7, "page_no": 14, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.8057592511177063, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 14, "cluster": {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "caption", "id": 0, "page_no": 14, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 84.233, "t": 644.62, "r": 125.468, "b": 653.172, "coord_origin": "TOPLEFT"}, "confidence": 0.9257225394248962, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 15:"}, {"label": "caption", "id": 1, "page_no": 14, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 308.862, "t": 653.204, "r": 349.559, "b": 661.756, "coord_origin": "TOPLEFT"}, "confidence": 0.9134758710861206, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 16:"}, {"label": "table", "id": 4, "page_no": 14, "cluster": {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 6, "page_no": 14, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.8099280595779419, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 19, "page_no": 14, "cluster": {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 2, "page_no": 14, "cluster": {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 18, "page_no": 14, "cluster": {"id": 18, "label": "picture", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.567050039768219, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 10, "page_no": 14, "cluster": {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 20, "page_no": 14, "cluster": {"id": 20, "label": "picture", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.5515198707580566, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 9, "page_no": 14, "cluster": {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 5, "page_no": 14, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT"}, "confidence": 0.8410326838493347, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 22, "page_no": 14, "cluster": {"id": 22, "label": "picture", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.5478786826133728, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 8, "page_no": 14, "cluster": {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 7, "page_no": 14, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.8057592511177063, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 14, "cluster": {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_footer", "id": 3, "page_no": 14, "cluster": {"id": 3, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9037020802497864, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "15"}]}}, {"page_no": 15, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.558, "r_y0": 517.158, "r_x1": 545.114, "r_y1": 517.158, "r_x2": 545.114, "r_y2": 508.606, "r_x3": 96.558, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 529.113, "r_x1": 173.24, "r_y1": 529.113, "r_x2": 173.24, "r_y2": 520.5609999999999, "r_x3": 50.112, "r_y3": 520.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 508.606, "r": 91.198, "b": 517.158, "coord_origin": "TOPLEFT"}, "confidence": 0.9624594449996948, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9134101271629333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "picture", "bbox": {"l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT"}, "confidence": 0.6913455724716187, "cells": [], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 0, "page_no": 15, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 508.606, "r": 91.198, "b": 517.158, "coord_origin": "TOPLEFT"}, "confidence": 0.9624594449996948, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 17:"}, {"label": "page_footer", "id": 1, "page_no": 15, "cluster": {"id": 1, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9134101271629333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "16"}, {"label": "picture", "id": 2, "page_no": 15, "cluster": {"id": 2, "label": "picture", "bbox": {"l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT"}, "confidence": 0.6913455724716187, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 0, "page_no": 15, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 508.606, "r": 91.198, "b": 517.158, "coord_origin": "TOPLEFT"}, "confidence": 0.9624594449996948, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 17:"}, {"label": "picture", "id": 2, "page_no": 15, "cluster": {"id": 2, "label": "picture", "bbox": {"l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT"}, "confidence": 0.6913455724716187, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 1, "page_no": 15, "cluster": {"id": 1, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9134101271629333, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "16"}]}}]