[ { "page_no": 0, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.301003, "r_y0": 119.93133999999998, "r_x1": 498.92708999999996, "r_y1": 119.93133999999998, "r_x2": 498.92708999999996, "r_y2": 107.03412000000003, "r_x3": 96.301003, "r_y3": 107.03412000000003, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.47701, "r_y0": 157.37334999999996, "r_x1": 452.75027, "r_y1": 157.37334999999996, "r_x2": 452.75027, "r_y2": 146.68535999999995, "r_x3": 142.47701, "r_y3": 146.68535999999995, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.918, "r_y0": 171.32037000000003, "r_x1": 332.30597, "r_y1": 171.32037000000003, "r_x2": 332.30597, "r_y2": 160.63239, "r_x3": 262.918, "r_y3": 160.63239, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.123, "r_y0": 184.42553999999996, "r_x1": 212.73083, "r_y1": 184.42553999999996, "r_x2": 212.73083, "r_y2": 175.96123999999998, "r_x3": 208.123, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.00409000000002, "r_x1": 293.42761, "r_y1": 184.00409000000002, "r_x2": 293.42761, "r_y2": 177.08203000000003, "r_x3": 212.73, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.42798, "r_y0": 184.42553999999996, "r_x1": 298.0358, "r_y1": 184.42553999999996, "r_x2": 298.0358, "r_y2": 175.96123999999998, "r_x3": 293.42798, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03497, "r_y0": 184.00409000000002, "r_x1": 378.73257, "r_y1": 184.00409000000002, "r_x2": 378.73257, "r_y2": 177.08203000000003, "r_x3": 298.03497, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99498, "r_y0": 226.23071000000004, "r_x1": 190.48029, "r_y1": 226.23071000000004, "r_x2": 190.48029, "r_y2": 215.48297000000002, "r_x3": 145.99498, "r_y3": 215.48297000000002, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 249.98284999999998, "r_x1": 286.36493, "r_y1": 249.98284999999998, "r_x2": 286.36493, "r_y2": 241.39508, "r_x3": 62.066978, "r_y3": 241.39508, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 261.93787, "r_x1": 286.36508, "r_y1": 261.93787, "r_x2": 286.36508, "r_y2": 253.3501, "r_x3": 50.111977, "r_y3": 253.3501, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 273.89288, "r_x1": 286.36508, "r_y1": 273.89288, "r_x2": 286.36508, "r_y2": 265.30511, "r_x3": 50.111977, "r_y3": 265.30511, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 285.84888, "r_x1": 286.36505, "r_y1": 285.84888, "r_x2": 286.36505, "r_y2": 277.26111000000003, "r_x3": 50.111977, "r_y3": 277.26111000000003, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 297.80386, "r_x1": 286.36505, "r_y1": 297.80386, "r_x2": 286.36505, "r_y2": 289.21609, "r_x3": 50.111977, "r_y3": 289.21609, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 309.75884999999994, "r_x1": 286.36505, "r_y1": 309.75884999999994, "r_x2": 286.36505, "r_y2": 301.17108, "r_x3": 50.111977, "r_y3": 301.17108, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 321.71384, "r_x1": 286.36508, "r_y1": 321.71384, "r_x2": 286.36508, "r_y2": 313.12607, "r_x3": 50.111977, "r_y3": 313.12607, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 333.66882, "r_x1": 286.36508, "r_y1": 333.66882, "r_x2": 286.36508, "r_y2": 325.08105, "r_x3": 50.111977, "r_y3": 325.08105, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 345.62381, "r_x1": 286.36505, "r_y1": 345.62381, "r_x2": 286.36505, "r_y2": 337.03604, "r_x3": 50.111977, "r_y3": 337.03604, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 357.5798, "r_x1": 286.36508, "r_y1": 357.5798, "r_x2": 286.36508, "r_y2": 348.99203, "r_x3": 50.111977, "r_y3": 348.99203, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 369.53479, "r_x1": 286.36505, "r_y1": 369.53479, "r_x2": 286.36505, "r_y2": 360.94701999999995, "r_x3": 50.111977, "r_y3": 360.94701999999995, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 381.48978, "r_x1": 286.36508, "r_y1": 381.48978, "r_x2": 286.36508, "r_y2": 372.90201, "r_x3": 50.111977, "r_y3": 372.90201, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 393.44476, "r_x1": 286.36505, "r_y1": 393.44476, "r_x2": 286.36505, "r_y2": 384.85699, "r_x3": 50.111977, "r_y3": 384.85699, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 405.39975000000004, "r_x1": 286.36511, "r_y1": 405.39975000000004, "r_x2": 286.36511, "r_y2": 396.81198, "r_x3": 50.111977, "r_y3": 396.81198, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 417.35474, "r_x1": 286.36508, "r_y1": 417.35474, "r_x2": 286.36508, "r_y2": 408.76697, "r_x3": 50.111977, "r_y3": 408.76697, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 429.31073, "r_x1": 286.36505, "r_y1": 429.31073, "r_x2": 286.36505, "r_y2": 420.72296000000006, "r_x3": 50.111977, "r_y3": 420.72296000000006, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 441.26572, "r_x1": 207.23216, "r_y1": 441.26572, "r_x2": 207.23216, "r_y2": 432.67795, "r_x3": 50.111977, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.09639, "r_y0": 441.26572, "r_x1": 286.36508, "r_y1": 441.26572, "r_x2": 286.36508, "r_y2": 432.67795, "r_x3": 214.09639, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 453.2207, "r_x1": 286.36508, "r_y1": 453.2207, "r_x2": 286.36508, "r_y2": 444.63293, "r_x3": 50.111977, "r_y3": 444.63293, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 465.17569, "r_x1": 286.36505, "r_y1": 465.17569, "r_x2": 286.36505, "r_y2": 456.58792000000005, "r_x3": 50.111977, "r_y3": 456.58792000000005, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 477.13068, "r_x1": 286.36505, "r_y1": 477.13068, "r_x2": 286.36505, "r_y2": 468.54291, "r_x3": 50.111977, "r_y3": 468.54291, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 489.08667, "r_x1": 286.36508, "r_y1": 489.08667, "r_x2": 286.36508, "r_y2": 480.4989, "r_x3": 50.111977, "r_y3": 480.4989, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 501.04166, "r_x1": 286.36505, "r_y1": 501.04166, "r_x2": 286.36505, "r_y2": 492.45389, "r_x3": 50.111977, "r_y3": 492.45389, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 512.9966400000001, "r_x1": 276.65152, "r_y1": 512.9966400000001, "r_x2": 276.65152, "r_y2": 504.40887, "r_x3": 50.111977, "r_y3": 504.40887, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 550.69049, "r_x1": 58.121296, "r_y1": 550.69049, "r_x2": 58.121296, "r_y2": 539.94276, "r_x3": 50.111977, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.800385, "r_y0": 550.69049, "r_x1": 126.94804, "r_y1": 550.69049, "r_x2": 126.94804, "r_y2": 539.94276, "r_x3": 68.800385, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 569.68976, "r_x1": 286.36496, "r_y1": 569.68976, "r_x2": 286.36496, "r_y2": 560.7832, "r_x3": 62.066978, "r_y3": 560.7832, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 581.64476, "r_x1": 286.36508, "r_y1": 581.64476, "r_x2": 286.36508, "r_y2": 572.7382, "r_x3": 50.111977, "r_y3": 572.7382, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 593.5997600000001, "r_x1": 286.36505, "r_y1": 593.5997600000001, "r_x2": 286.36505, "r_y2": 584.69321, "r_x3": 50.111977, "r_y3": 584.69321, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 605.55576, "r_x1": 286.36505, "r_y1": 605.55576, "r_x2": 286.36505, "r_y2": 596.6492000000001, "r_x3": 50.111977, "r_y3": 596.6492000000001, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 617.51076, "r_x1": 286.36505, "r_y1": 617.51076, "r_x2": 286.36505, "r_y2": 608.6042, "r_x3": 50.111977, "r_y3": 608.6042, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 629.46576, "r_x1": 286.36505, "r_y1": 629.46576, "r_x2": 286.36505, "r_y2": 620.5592, "r_x3": 50.111977, "r_y3": 620.5592, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 641.42076, "r_x1": 286.36508, "r_y1": 641.42076, "r_x2": 286.36508, "r_y2": 632.51421, "r_x3": 50.111977, "r_y3": 632.51421, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 653.37576, "r_x1": 286.36508, "r_y1": 653.37576, "r_x2": 286.36508, "r_y2": 644.46921, "r_x3": 50.111977, "r_y3": 644.46921, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 665.33077, "r_x1": 286.36502, "r_y1": 665.33077, "r_x2": 286.36502, "r_y2": 656.42421, "r_x3": 50.111977, "r_y3": 656.42421, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 677.28677, "r_x1": 286.36505, "r_y1": 677.28677, "r_x2": 286.36505, "r_y2": 668.3802000000001, "r_x3": 50.111977, "r_y3": 668.3802000000001, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 689.2417800000001, "r_x1": 286.36505, "r_y1": 689.2417800000001, "r_x2": 286.36505, "r_y2": 680.33521, "r_x3": 50.111977, "r_y3": 680.33521, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 701.196777, "r_x1": 286.36505, "r_y1": 701.196777, "r_x2": 286.36505, "r_y2": 692.290207, "r_x3": 50.111977, "r_y3": 692.290207, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 713.151779, "r_x1": 76.403275, "r_y1": 713.151779, "r_x2": 76.403275, "r_y2": 704.245209, "r_x3": 50.111977, "r_y3": 704.245209, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 226.75482, "r_x1": 324.01007, "r_y1": 226.75482, "r_x2": 324.01007, "r_y2": 218.00684, "r_x3": 315.56702, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.2316, "r_y0": 226.75482, "r_x1": 408.4407, "r_y1": 226.75482, "r_x2": 408.4407, "r_y2": 218.00684, "r_x3": 328.2316, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 322.44281, "r_x1": 325.05786, "r_y1": 322.44281, "r_x2": 325.05786, "r_y2": 313.69478999999995, "r_x3": 315.56702, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.80325, "r_y0": 322.44281, "r_x1": 486.40194999999994, "r_y1": 322.44281, "r_x2": 486.40194999999994, "r_y2": 313.69478999999995, "r_x3": 329.80325, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46252, "r_y0": 333.2428, "r_x1": 472.47411999999997, "r_y1": 333.2428, "r_x2": 472.47411999999997, "r_y2": 324.49478, "r_x3": 326.46252, "r_y3": 324.49478, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 428.93082, "r_x1": 324.81039, "r_y1": 428.93082, "r_x2": 324.81039, "r_y2": 420.1828, "r_x3": 315.56702, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.4321, "r_y0": 428.93082, "r_x1": 491.1912500000001, "r_y1": 428.93082, "r_x2": 491.1912500000001, "r_y2": 420.1828, "r_x3": 329.4321, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.14752, "r_y0": 351.61322, "r_x1": 412.54001, "r_y1": 351.61322, "r_x2": 412.54001, "r_y2": 342.82828, "r_x3": 408.14752, "r_y3": 342.82828, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11011, "r_y0": 350.35712, "r_x1": 360.50259, "r_y1": 350.35712, "r_x2": 360.50259, "r_y2": 341.57217, "r_x3": 356.11011, "r_y3": 341.57217, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.6777, "r_y0": 349.7226299999999, "r_x1": 505.0701900000001, "r_y1": 349.7226299999999, "r_x2": 505.0701900000001, "r_y2": 340.93768, "r_x3": 500.6777, "r_y3": 340.93768, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13382, "r_y0": 360.53284, "r_x1": 360.52631, "r_y1": 360.53284, "r_x2": 360.52631, "r_y2": 351.74789, "r_x3": 356.13382, "r_y3": 351.74789, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.53992, "r_y0": 364.66144, "r_x1": 406.9324, "r_y1": 364.66144, "r_x2": 406.9324, "r_y2": 355.8765, "r_x3": 402.53992, "r_y3": 355.8765, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58178999999996, "r_y0": 361.62512, "r_x1": 452.97427, "r_y1": 361.62512, "r_x2": 452.97427, "r_y2": 352.84018, "r_x3": 448.58178999999996, "r_y3": 352.84018, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65161000000006, "r_y0": 362.49152, "r_x1": 496.0441, "r_y1": 362.49152, "r_x2": 496.0441, "r_y2": 353.70657, "r_x3": 491.65161000000006, "r_y3": 353.70657, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.13843, "r_y0": 362.12463, "r_x1": 539.53088, "r_y1": 362.12463, "r_x2": 539.53088, "r_y2": 353.33969, "r_x3": 535.13843, "r_y3": 353.33969, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.82822, "r_y0": 395.88275, "r_x1": 353.2207, "r_y1": 395.88275, "r_x2": 353.2207, "r_y2": 387.09781, "r_x3": 348.82822, "r_y3": 387.09781, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27151, "r_y0": 384.15723, "r_x1": 393.664, "r_y1": 384.15723, "r_x2": 393.664, "r_y2": 375.37228, "r_x3": 389.27151, "r_y3": 375.37228, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67479999999995, "r_y0": 384.43115, "r_x1": 451.45889000000005, "r_y1": 384.43115, "r_x2": 451.45889000000005, "r_y2": 375.64621, "r_x3": 442.67479999999995, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.4382299999999, "r_y0": 384.31894000000005, "r_x1": 485.90167, "r_y1": 384.31894000000005, "r_x2": 485.90167, "r_y2": 375.534, "r_x3": 477.4382299999999, "r_y3": 375.534, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57263, "r_y0": 384.43115, "r_x1": 531.35669, "r_y1": 384.43115, "r_x2": 531.35669, "r_y2": 375.64621, "r_x3": 522.57263, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.22992, "r_y0": 395.89923, "r_x1": 409.01401, "r_y1": 395.89923, "r_x2": 409.01401, "r_y2": 387.11429, "r_x3": 400.22992, "r_y3": 387.11429, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30792, "r_y0": 395.77475000000004, "r_x1": 451.0920100000001, "r_y1": 395.77475000000004, "r_x2": 451.0920100000001, "r_y2": 386.98981000000003, "r_x3": 442.30792, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.21941999999996, "r_y0": 396.15964, "r_x1": 487.00351000000006, "r_y1": 396.15964, "r_x2": 487.00351000000006, "r_y2": 387.37469, "r_x3": 478.21941999999996, "r_y3": 387.37469, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.2287, "r_y0": 395.77475000000004, "r_x1": 532.01276, "r_y1": 395.77475000000004, "r_x2": 532.01276, "r_y2": 386.98981000000003, "r_x3": 523.2287, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57233, "r_y0": 408.20972, "r_x1": 415.96481, "r_y1": 408.20972, "r_x2": 415.96481, "r_y2": 399.42477, "r_x3": 411.57233, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96393, "r_y0": 408.20972, "r_x1": 420.35641, "r_y1": 408.20972, "r_x2": 420.35641, "r_y2": 399.42477, "r_x3": 415.96393, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30521, "r_y0": 407.82213999999993, "r_x1": 451.08929, "r_y1": 407.82213999999993, "r_x2": 451.08929, "r_y2": 399.0371999999999, "r_x3": 442.30521, "r_y3": 399.0371999999999, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.77893, "r_y0": 407.78133999999994, "r_x1": 487.56302, "r_y1": 407.78133999999994, "r_x2": 487.56302, "r_y2": 398.99639999999994, "r_x3": 478.77893, "r_y3": 398.99639999999994, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97241, "r_y0": 407.39642, "r_x1": 532.75647, "r_y1": 407.39642, "r_x2": 532.75647, "r_y2": 398.6114799999999, "r_x3": 523.97241, "r_y3": 398.6114799999999, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09399, "r_y0": 367.89072, "r_x1": 391.09879, "r_y1": 367.89072, "r_x2": 391.09879, "r_y2": 357.76030999999995, "r_x3": 385.09399, "r_y3": 357.76030999999995, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43451, "r_y0": 390.85689999999994, "r_x1": 339.4393, "r_y1": 390.85689999999994, "r_x2": 339.4393, "r_y2": 380.7265, "r_x3": 333.43451, "r_y3": 380.7265, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07210999999995, "r_y0": 351.16720999999995, "r_x1": 484.0769, "r_y1": 351.16720999999995, "r_x2": 484.0769, "r_y2": 341.0368000000001, "r_x3": 478.07210999999995, "r_y3": 341.0368000000001, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 523.40692, "r_x1": 345.73361, "r_y1": 523.40692, "r_x2": 345.73361, "r_y2": 514.50037, "r_x3": 308.862, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.17566, "r_y0": 523.40692, "r_x1": 545.11511, "r_y1": 523.40692, "r_x2": 545.11511, "r_y2": 514.50037, "r_x3": 353.17566, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 535.3619100000001, "r_x1": 545.11511, "r_y1": 535.3619100000001, "r_x2": 545.11511, "r_y2": 526.45535, "r_x3": 308.862, "r_y3": 526.45535, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 547.31691, "r_x1": 545.11517, "r_y1": 547.31691, "r_x2": 545.11517, "r_y2": 538.41035, "r_x3": 308.862, "r_y3": 538.41035, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 559.2729, "r_x1": 505.6917700000001, "r_y1": 559.2729, "r_x2": 505.6917700000001, "r_y2": 550.36635, "r_x3": 308.862, "r_y3": 550.36635, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 593.31592, "r_x1": 545.11493, "r_y1": 593.31592, "r_x2": 545.11493, "r_y2": 584.40936, "r_x3": 320.81699, "r_y3": 584.40936, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2709199999999, "r_x1": 545.11517, "r_y1": 605.2709199999999, "r_x2": 545.11517, "r_y2": 596.36436, "r_x3": 308.862, "r_y3": 596.36436, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.22592, "r_x1": 545.11511, "r_y1": 617.22592, "r_x2": 545.11511, "r_y2": 608.31937, "r_x3": 308.862, "r_y3": 608.31937, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.18092, "r_x1": 545.11505, "r_y1": 629.18092, "r_x2": 545.11505, "r_y2": 620.27437, "r_x3": 308.862, "r_y3": 620.27437, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.13692, "r_x1": 353.6937, "r_y1": 641.13692, "r_x2": 353.6937, "r_y2": 632.23036, "r_x3": 308.862, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11209, "r_y0": 641.13692, "r_x1": 374.66617, "r_y1": 641.13692, "r_x2": 374.66617, "r_y2": 632.23036, "r_x3": 362.11209, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.35785, "r_y0": 641.13692, "r_x1": 545.11505, "r_y1": 641.13692, "r_x2": 545.11505, "r_y2": 632.23036, "r_x3": 377.35785, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.09192, "r_x1": 545.11517, "r_y1": 653.09192, "r_x2": 545.11517, "r_y2": 644.18536, "r_x3": 308.862, "r_y3": 644.18536, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.04693, "r_x1": 375.55167, "r_y1": 665.04693, "r_x2": 375.55167, "r_y2": 656.14037, "r_x3": 308.862, "r_y3": 656.14037, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 677.28693, "r_x1": 545.11493, "r_y1": 677.28693, "r_x2": 545.11493, "r_y2": 668.38036, "r_x3": 320.81699, "r_y3": 668.38036, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24193, "r_x1": 545.11511, "r_y1": 689.24193, "r_x2": 545.11511, "r_y2": 680.33536, "r_x3": 308.862, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.19693, "r_x1": 545.11511, "r_y1": 701.19693, "r_x2": 545.11511, "r_y2": 692.290359, "r_x3": 308.862, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151932, "r_x1": 545.11499, "r_y1": 713.151932, "r_x2": 545.11499, "r_y2": 704.245361, "r_x3": 308.862, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340221, "r_y0": 560.00003, "r_x1": 36.339779, "r_y1": 560.00003, "r_x2": 36.339779, "r_y2": 207.82001000000002, "r_x3": 18.340221, "r_y3": 207.82001000000002, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 8, "label": "section_header", "bbox": { "l": 96.301003, "t": 107.03412000000003, "r": 498.92708999999996, "b": 119.93133999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.8868067860603333, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.301003, "r_y0": 119.93133999999998, "r_x1": 498.92708999999996, "r_y1": 119.93133999999998, "r_x2": 498.92708999999996, "r_y2": 107.03412000000003, "r_x3": 96.301003, "r_y3": 107.03412000000003, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 142.47701, "t": 146.68535999999995, "r": 452.75027, "b": 171.32037000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.7586215734481812, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.47701, "r_y0": 157.37334999999996, "r_x1": 452.75027, "r_y1": 157.37334999999996, "r_x2": 452.75027, "r_y2": 146.68535999999995, "r_x3": 142.47701, "r_y3": 146.68535999999995, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.918, "r_y0": 171.32037000000003, "r_x1": 332.30597, "r_y1": 171.32037000000003, "r_x2": 332.30597, "r_y2": 160.63239, "r_x3": 262.918, "r_y3": 160.63239, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "key_value_region", "bbox": { "l": 208.123, "t": 175.96123999999998, "r": 378.73257, "b": 184.42553999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.4854728579521179, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.123, "r_y0": 184.42553999999996, "r_x1": 212.73083, "r_y1": 184.42553999999996, "r_x2": 212.73083, "r_y2": 175.96123999999998, "r_x3": 208.123, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.00409000000002, "r_x1": 293.42761, "r_y1": 184.00409000000002, "r_x2": 293.42761, "r_y2": 177.08203000000003, "r_x3": 212.73, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.42798, "r_y0": 184.42553999999996, "r_x1": 298.0358, "r_y1": 184.42553999999996, "r_x2": 298.0358, "r_y2": 175.96123999999998, "r_x3": 293.42798, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03497, "r_y0": 184.00409000000002, "r_x1": 378.73257, "r_y1": 184.00409000000002, "r_x2": 378.73257, "r_y2": 177.08203000000003, "r_x3": 298.03497, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 208.123, "t": 175.96123999999998, "r": 378.73257, "b": 184.42553999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9096331596374512, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.123, "r_y0": 184.42553999999996, "r_x1": 212.73083, "r_y1": 184.42553999999996, "r_x2": 212.73083, "r_y2": 175.96123999999998, "r_x3": 208.123, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.00409000000002, "r_x1": 293.42761, "r_y1": 184.00409000000002, "r_x2": 293.42761, "r_y2": 177.08203000000003, "r_x3": 212.73, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.42798, "r_y0": 184.42553999999996, "r_x1": 298.0358, "r_y1": 184.42553999999996, "r_x2": 298.0358, "r_y2": 175.96123999999998, "r_x3": 293.42798, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03497, "r_y0": 184.00409000000002, "r_x1": 378.73257, "r_y1": 184.00409000000002, "r_x2": 378.73257, "r_y2": 177.08203000000003, "r_x3": 298.03497, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 5, "label": "section_header", "bbox": { "l": 145.99498, "t": 215.48297000000002, "r": 190.48029, "b": 226.23071000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9258671402931213, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99498, "r_y0": 226.23071000000004, "r_x1": 190.48029, "r_y1": 226.23071000000004, "r_x2": 190.48029, "r_y2": 215.48297000000002, "r_x3": 145.99498, "r_y3": 215.48297000000002, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.111977, "t": 241.39508, "r": 286.36511, "b": 512.9966400000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9838882088661194, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 249.98284999999998, "r_x1": 286.36493, "r_y1": 249.98284999999998, "r_x2": 286.36493, "r_y2": 241.39508, "r_x3": 62.066978, "r_y3": 241.39508, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 261.93787, "r_x1": 286.36508, "r_y1": 261.93787, "r_x2": 286.36508, "r_y2": 253.3501, "r_x3": 50.111977, "r_y3": 253.3501, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 273.89288, "r_x1": 286.36508, "r_y1": 273.89288, "r_x2": 286.36508, "r_y2": 265.30511, "r_x3": 50.111977, "r_y3": 265.30511, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 285.84888, "r_x1": 286.36505, "r_y1": 285.84888, "r_x2": 286.36505, "r_y2": 277.26111000000003, "r_x3": 50.111977, "r_y3": 277.26111000000003, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 297.80386, "r_x1": 286.36505, "r_y1": 297.80386, "r_x2": 286.36505, "r_y2": 289.21609, "r_x3": 50.111977, "r_y3": 289.21609, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 309.75884999999994, "r_x1": 286.36505, "r_y1": 309.75884999999994, "r_x2": 286.36505, "r_y2": 301.17108, "r_x3": 50.111977, "r_y3": 301.17108, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 321.71384, "r_x1": 286.36508, "r_y1": 321.71384, "r_x2": 286.36508, "r_y2": 313.12607, "r_x3": 50.111977, "r_y3": 313.12607, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 333.66882, "r_x1": 286.36508, "r_y1": 333.66882, "r_x2": 286.36508, "r_y2": 325.08105, "r_x3": 50.111977, "r_y3": 325.08105, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 345.62381, "r_x1": 286.36505, "r_y1": 345.62381, "r_x2": 286.36505, "r_y2": 337.03604, "r_x3": 50.111977, "r_y3": 337.03604, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 357.5798, "r_x1": 286.36508, "r_y1": 357.5798, "r_x2": 286.36508, "r_y2": 348.99203, "r_x3": 50.111977, "r_y3": 348.99203, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 369.53479, "r_x1": 286.36505, "r_y1": 369.53479, "r_x2": 286.36505, "r_y2": 360.94701999999995, "r_x3": 50.111977, "r_y3": 360.94701999999995, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 381.48978, "r_x1": 286.36508, "r_y1": 381.48978, "r_x2": 286.36508, "r_y2": 372.90201, "r_x3": 50.111977, "r_y3": 372.90201, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 393.44476, "r_x1": 286.36505, "r_y1": 393.44476, "r_x2": 286.36505, "r_y2": 384.85699, "r_x3": 50.111977, "r_y3": 384.85699, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 405.39975000000004, "r_x1": 286.36511, "r_y1": 405.39975000000004, "r_x2": 286.36511, "r_y2": 396.81198, "r_x3": 50.111977, "r_y3": 396.81198, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 417.35474, "r_x1": 286.36508, "r_y1": 417.35474, "r_x2": 286.36508, "r_y2": 408.76697, "r_x3": 50.111977, "r_y3": 408.76697, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 429.31073, "r_x1": 286.36505, "r_y1": 429.31073, "r_x2": 286.36505, "r_y2": 420.72296000000006, "r_x3": 50.111977, "r_y3": 420.72296000000006, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 441.26572, "r_x1": 207.23216, "r_y1": 441.26572, "r_x2": 207.23216, "r_y2": 432.67795, "r_x3": 50.111977, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.09639, "r_y0": 441.26572, "r_x1": 286.36508, "r_y1": 441.26572, "r_x2": 286.36508, "r_y2": 432.67795, "r_x3": 214.09639, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 453.2207, "r_x1": 286.36508, "r_y1": 453.2207, "r_x2": 286.36508, "r_y2": 444.63293, "r_x3": 50.111977, "r_y3": 444.63293, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 465.17569, "r_x1": 286.36505, "r_y1": 465.17569, "r_x2": 286.36505, "r_y2": 456.58792000000005, "r_x3": 50.111977, "r_y3": 456.58792000000005, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 477.13068, "r_x1": 286.36505, "r_y1": 477.13068, "r_x2": 286.36505, "r_y2": 468.54291, "r_x3": 50.111977, "r_y3": 468.54291, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 489.08667, "r_x1": 286.36508, "r_y1": 489.08667, "r_x2": 286.36508, "r_y2": 480.4989, "r_x3": 50.111977, "r_y3": 480.4989, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 501.04166, "r_x1": 286.36505, "r_y1": 501.04166, "r_x2": 286.36505, "r_y2": 492.45389, "r_x3": 50.111977, "r_y3": 492.45389, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 512.9966400000001, "r_x1": 276.65152, "r_y1": 512.9966400000001, "r_x2": 276.65152, "r_y2": 504.40887, "r_x3": 50.111977, "r_y3": 504.40887, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 50.111977, "t": 539.94276, "r": 126.94804, "b": 550.69049, "coord_origin": "TOPLEFT" }, "confidence": 0.9317677617073059, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 550.69049, "r_x1": 58.121296, "r_y1": 550.69049, "r_x2": 58.121296, "r_y2": 539.94276, "r_x3": 50.111977, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.800385, "r_y0": 550.69049, "r_x1": 126.94804, "r_y1": 550.69049, "r_x2": 126.94804, "r_y2": 539.94276, "r_x3": 68.800385, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.111977, "t": 560.7832, "r": 286.36508, "b": 713.151779, "coord_origin": "TOPLEFT" }, "confidence": 0.9841895699501038, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 569.68976, "r_x1": 286.36496, "r_y1": 569.68976, "r_x2": 286.36496, "r_y2": 560.7832, "r_x3": 62.066978, "r_y3": 560.7832, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 581.64476, "r_x1": 286.36508, "r_y1": 581.64476, "r_x2": 286.36508, "r_y2": 572.7382, "r_x3": 50.111977, "r_y3": 572.7382, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 593.5997600000001, "r_x1": 286.36505, "r_y1": 593.5997600000001, "r_x2": 286.36505, "r_y2": 584.69321, "r_x3": 50.111977, "r_y3": 584.69321, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 605.55576, "r_x1": 286.36505, "r_y1": 605.55576, "r_x2": 286.36505, "r_y2": 596.6492000000001, "r_x3": 50.111977, "r_y3": 596.6492000000001, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 617.51076, "r_x1": 286.36505, "r_y1": 617.51076, "r_x2": 286.36505, "r_y2": 608.6042, "r_x3": 50.111977, "r_y3": 608.6042, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 629.46576, "r_x1": 286.36505, "r_y1": 629.46576, "r_x2": 286.36505, "r_y2": 620.5592, "r_x3": 50.111977, "r_y3": 620.5592, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 641.42076, "r_x1": 286.36508, "r_y1": 641.42076, "r_x2": 286.36508, "r_y2": 632.51421, "r_x3": 50.111977, "r_y3": 632.51421, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 653.37576, "r_x1": 286.36508, "r_y1": 653.37576, "r_x2": 286.36508, "r_y2": 644.46921, "r_x3": 50.111977, "r_y3": 644.46921, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 665.33077, "r_x1": 286.36502, "r_y1": 665.33077, "r_x2": 286.36502, "r_y2": 656.42421, "r_x3": 50.111977, "r_y3": 656.42421, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 677.28677, "r_x1": 286.36505, "r_y1": 677.28677, "r_x2": 286.36505, "r_y2": 668.3802000000001, "r_x3": 50.111977, "r_y3": 668.3802000000001, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 689.2417800000001, "r_x1": 286.36505, "r_y1": 689.2417800000001, "r_x2": 286.36505, "r_y2": 680.33521, "r_x3": 50.111977, "r_y3": 680.33521, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 701.196777, "r_x1": 286.36505, "r_y1": 701.196777, "r_x2": 286.36505, "r_y2": 692.290207, "r_x3": 50.111977, "r_y3": 692.290207, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 713.151779, "r_x1": 76.403275, "r_y1": 713.151779, "r_x2": 76.403275, "r_y2": 704.245209, "r_x3": 50.111977, "r_y3": 704.245209, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "section_header", "bbox": { "l": 315.56702, "t": 218.00684, "r": 408.4407, "b": 226.75482, "coord_origin": "TOPLEFT" }, "confidence": 0.6724023818969727, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 226.75482, "r_x1": 324.01007, "r_y1": 226.75482, "r_x2": 324.01007, "r_y2": 218.00684, "r_x3": 315.56702, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.2316, "r_y0": 226.75482, "r_x1": 408.4407, "r_y1": 226.75482, "r_x2": 408.4407, "r_y2": 218.00684, "r_x3": 328.2316, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "list_item", "bbox": { "l": 315.56702, "t": 313.69478999999995, "r": 486.40194999999994, "b": 333.2428, "coord_origin": "TOPLEFT" }, "confidence": 0.5549328923225403, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 322.44281, "r_x1": 325.05786, "r_y1": 322.44281, "r_x2": 325.05786, "r_y2": 313.69478999999995, "r_x3": 315.56702, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.80325, "r_y0": 322.44281, "r_x1": 486.40194999999994, "r_y1": 322.44281, "r_x2": 486.40194999999994, "r_y2": 313.69478999999995, "r_x3": 329.80325, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46252, "r_y0": 333.2428, "r_x1": 472.47411999999997, "r_y1": 333.2428, "r_x2": 472.47411999999997, "r_y2": 324.49478, "r_x3": 326.46252, "r_y3": 324.49478, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 315.56702, "t": 420.1828, "r": 491.1912500000001, "b": 428.93082, "coord_origin": "TOPLEFT" }, "confidence": 0.5501358509063721, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 428.93082, "r_x1": 324.81039, "r_y1": 428.93082, "r_x2": 324.81039, "r_y2": 420.1828, "r_x3": 315.56702, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.4321, "r_y0": 428.93082, "r_x1": 491.1912500000001, "r_y1": 428.93082, "r_x2": 491.1912500000001, "r_y2": 420.1828, "r_x3": 329.4321, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "picture", "bbox": { "l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT" }, "confidence": 0.8742761611938477, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.14752, "r_y0": 351.61322, "r_x1": 412.54001, "r_y1": 351.61322, "r_x2": 412.54001, "r_y2": 342.82828, "r_x3": 408.14752, "r_y3": 342.82828, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11011, "r_y0": 350.35712, "r_x1": 360.50259, "r_y1": 350.35712, "r_x2": 360.50259, "r_y2": 341.57217, "r_x3": 356.11011, "r_y3": 341.57217, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.6777, "r_y0": 349.7226299999999, "r_x1": 505.0701900000001, "r_y1": 349.7226299999999, "r_x2": 505.0701900000001, "r_y2": 340.93768, "r_x3": 500.6777, "r_y3": 340.93768, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13382, "r_y0": 360.53284, "r_x1": 360.52631, "r_y1": 360.53284, "r_x2": 360.52631, "r_y2": 351.74789, "r_x3": 356.13382, "r_y3": 351.74789, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.53992, "r_y0": 364.66144, "r_x1": 406.9324, "r_y1": 364.66144, "r_x2": 406.9324, "r_y2": 355.8765, "r_x3": 402.53992, "r_y3": 355.8765, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58178999999996, "r_y0": 361.62512, "r_x1": 452.97427, "r_y1": 361.62512, "r_x2": 452.97427, "r_y2": 352.84018, "r_x3": 448.58178999999996, "r_y3": 352.84018, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65161000000006, "r_y0": 362.49152, "r_x1": 496.0441, "r_y1": 362.49152, "r_x2": 496.0441, "r_y2": 353.70657, "r_x3": 491.65161000000006, "r_y3": 353.70657, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.13843, "r_y0": 362.12463, "r_x1": 539.53088, "r_y1": 362.12463, "r_x2": 539.53088, "r_y2": 353.33969, "r_x3": 535.13843, "r_y3": 353.33969, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.82822, "r_y0": 395.88275, "r_x1": 353.2207, "r_y1": 395.88275, "r_x2": 353.2207, "r_y2": 387.09781, "r_x3": 348.82822, "r_y3": 387.09781, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27151, "r_y0": 384.15723, "r_x1": 393.664, "r_y1": 384.15723, "r_x2": 393.664, "r_y2": 375.37228, "r_x3": 389.27151, "r_y3": 375.37228, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67479999999995, "r_y0": 384.43115, "r_x1": 451.45889000000005, "r_y1": 384.43115, "r_x2": 451.45889000000005, "r_y2": 375.64621, "r_x3": 442.67479999999995, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.4382299999999, "r_y0": 384.31894000000005, "r_x1": 485.90167, "r_y1": 384.31894000000005, "r_x2": 485.90167, "r_y2": 375.534, "r_x3": 477.4382299999999, "r_y3": 375.534, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57263, "r_y0": 384.43115, "r_x1": 531.35669, "r_y1": 384.43115, "r_x2": 531.35669, "r_y2": 375.64621, "r_x3": 522.57263, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.22992, "r_y0": 395.89923, "r_x1": 409.01401, "r_y1": 395.89923, "r_x2": 409.01401, "r_y2": 387.11429, "r_x3": 400.22992, "r_y3": 387.11429, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30792, "r_y0": 395.77475000000004, "r_x1": 451.0920100000001, "r_y1": 395.77475000000004, "r_x2": 451.0920100000001, "r_y2": 386.98981000000003, "r_x3": 442.30792, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.21941999999996, "r_y0": 396.15964, "r_x1": 487.00351000000006, "r_y1": 396.15964, "r_x2": 487.00351000000006, "r_y2": 387.37469, "r_x3": 478.21941999999996, "r_y3": 387.37469, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.2287, "r_y0": 395.77475000000004, "r_x1": 532.01276, "r_y1": 395.77475000000004, "r_x2": 532.01276, "r_y2": 386.98981000000003, "r_x3": 523.2287, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57233, "r_y0": 408.20972, "r_x1": 415.96481, "r_y1": 408.20972, "r_x2": 415.96481, "r_y2": 399.42477, "r_x3": 411.57233, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96393, "r_y0": 408.20972, "r_x1": 420.35641, "r_y1": 408.20972, "r_x2": 420.35641, "r_y2": 399.42477, "r_x3": 415.96393, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30521, "r_y0": 407.82213999999993, "r_x1": 451.08929, "r_y1": 407.82213999999993, "r_x2": 451.08929, "r_y2": 399.0371999999999, "r_x3": 442.30521, "r_y3": 399.0371999999999, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.77893, "r_y0": 407.78133999999994, "r_x1": 487.56302, "r_y1": 407.78133999999994, "r_x2": 487.56302, "r_y2": 398.99639999999994, "r_x3": 478.77893, "r_y3": 398.99639999999994, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97241, "r_y0": 407.39642, "r_x1": 532.75647, "r_y1": 407.39642, "r_x2": 532.75647, "r_y2": 398.6114799999999, "r_x3": 523.97241, "r_y3": 398.6114799999999, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09399, "r_y0": 367.89072, "r_x1": 391.09879, "r_y1": 367.89072, "r_x2": 391.09879, "r_y2": 357.76030999999995, "r_x3": 385.09399, "r_y3": 357.76030999999995, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43451, "r_y0": 390.85689999999994, "r_x1": 339.4393, "r_y1": 390.85689999999994, "r_x2": 339.4393, "r_y2": 380.7265, "r_x3": 333.43451, "r_y3": 380.7265, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07210999999995, "r_y0": 351.16720999999995, "r_x1": 484.0769, "r_y1": 351.16720999999995, "r_x2": 484.0769, "r_y2": 341.0368000000001, "r_x3": 478.07210999999995, "r_y3": 341.0368000000001, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 40, "label": "text", "bbox": { "l": 408.14752, "t": 342.82828, "r": 412.54001, "b": 351.61322, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.14752, "r_y0": 351.61322, "r_x1": 412.54001, "r_y1": 351.61322, "r_x2": 412.54001, "r_y2": 342.82828, "r_x3": 408.14752, "r_y3": 342.82828, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 356.11011, "t": 341.57217, "r": 360.50259, "b": 350.35712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11011, "r_y0": 350.35712, "r_x1": 360.50259, "r_y1": 350.35712, "r_x2": 360.50259, "r_y2": 341.57217, "r_x3": 356.11011, "r_y3": 341.57217, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 500.6777, "t": 340.93768, "r": 505.0701900000001, "b": 349.7226299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.6777, "r_y0": 349.7226299999999, "r_x1": 505.0701900000001, "r_y1": 349.7226299999999, "r_x2": 505.0701900000001, "r_y2": 340.93768, "r_x3": 500.6777, "r_y3": 340.93768, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 356.13382, "t": 351.74789, "r": 360.52631, "b": 360.53284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13382, "r_y0": 360.53284, "r_x1": 360.52631, "r_y1": 360.53284, "r_x2": 360.52631, "r_y2": 351.74789, "r_x3": 356.13382, "r_y3": 351.74789, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 402.53992, "t": 355.8765, "r": 406.9324, "b": 364.66144, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.53992, "r_y0": 364.66144, "r_x1": 406.9324, "r_y1": 364.66144, "r_x2": 406.9324, "r_y2": 355.8765, "r_x3": 402.53992, "r_y3": 355.8765, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 448.58178999999996, "t": 352.84018, "r": 452.97427, "b": 361.62512, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58178999999996, "r_y0": 361.62512, "r_x1": 452.97427, "r_y1": 361.62512, "r_x2": 452.97427, "r_y2": 352.84018, "r_x3": 448.58178999999996, "r_y3": 352.84018, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 491.65161000000006, "t": 353.70657, "r": 496.0441, "b": 362.49152, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65161000000006, "r_y0": 362.49152, "r_x1": 496.0441, "r_y1": 362.49152, "r_x2": 496.0441, "r_y2": 353.70657, "r_x3": 491.65161000000006, "r_y3": 353.70657, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 535.13843, "t": 353.33969, "r": 539.53088, "b": 362.12463, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.13843, "r_y0": 362.12463, "r_x1": 539.53088, "r_y1": 362.12463, "r_x2": 539.53088, "r_y2": 353.33969, "r_x3": 535.13843, "r_y3": 353.33969, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 348.82822, "t": 387.09781, "r": 353.2207, "b": 395.88275, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.82822, "r_y0": 395.88275, "r_x1": 353.2207, "r_y1": 395.88275, "r_x2": 353.2207, "r_y2": 387.09781, "r_x3": 348.82822, "r_y3": 387.09781, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 389.27151, "t": 375.37228, "r": 393.664, "b": 384.15723, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27151, "r_y0": 384.15723, "r_x1": 393.664, "r_y1": 384.15723, "r_x2": 393.664, "r_y2": 375.37228, "r_x3": 389.27151, "r_y3": 375.37228, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 442.67479999999995, "t": 375.64621, "r": 451.45889000000005, "b": 384.43115, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67479999999995, "r_y0": 384.43115, "r_x1": 451.45889000000005, "r_y1": 384.43115, "r_x2": 451.45889000000005, "r_y2": 375.64621, "r_x3": 442.67479999999995, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 477.4382299999999, "t": 375.534, "r": 485.90167, "b": 384.31894000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.4382299999999, "r_y0": 384.31894000000005, "r_x1": 485.90167, "r_y1": 384.31894000000005, "r_x2": 485.90167, "r_y2": 375.534, "r_x3": 477.4382299999999, "r_y3": 375.534, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 522.57263, "t": 375.64621, "r": 531.35669, "b": 384.43115, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57263, "r_y0": 384.43115, "r_x1": 531.35669, "r_y1": 384.43115, "r_x2": 531.35669, "r_y2": 375.64621, "r_x3": 522.57263, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 400.22992, "t": 387.11429, "r": 409.01401, "b": 395.89923, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.22992, "r_y0": 395.89923, "r_x1": 409.01401, "r_y1": 395.89923, "r_x2": 409.01401, "r_y2": 387.11429, "r_x3": 400.22992, "r_y3": 387.11429, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 442.30792, "t": 386.98981000000003, "r": 451.0920100000001, "b": 395.77475000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30792, "r_y0": 395.77475000000004, "r_x1": 451.0920100000001, "r_y1": 395.77475000000004, "r_x2": 451.0920100000001, "r_y2": 386.98981000000003, "r_x3": 442.30792, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 478.21941999999996, "t": 387.37469, "r": 487.00351000000006, "b": 396.15964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.21941999999996, "r_y0": 396.15964, "r_x1": 487.00351000000006, "r_y1": 396.15964, "r_x2": 487.00351000000006, "r_y2": 387.37469, "r_x3": 478.21941999999996, "r_y3": 387.37469, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 523.2287, "t": 386.98981000000003, "r": 532.01276, "b": 395.77475000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.2287, "r_y0": 395.77475000000004, "r_x1": 532.01276, "r_y1": 395.77475000000004, "r_x2": 532.01276, "r_y2": 386.98981000000003, "r_x3": 523.2287, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 411.57233, "t": 399.42477, "r": 415.96481, "b": 408.20972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57233, "r_y0": 408.20972, "r_x1": 415.96481, "r_y1": 408.20972, "r_x2": 415.96481, "r_y2": 399.42477, "r_x3": 411.57233, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 415.96393, "t": 399.42477, "r": 420.35641, "b": 408.20972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96393, "r_y0": 408.20972, "r_x1": 420.35641, "r_y1": 408.20972, "r_x2": 420.35641, "r_y2": 399.42477, "r_x3": 415.96393, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 442.30521, "t": 399.0371999999999, "r": 451.08929, "b": 407.82213999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30521, "r_y0": 407.82213999999993, "r_x1": 451.08929, "r_y1": 407.82213999999993, "r_x2": 451.08929, "r_y2": 399.0371999999999, "r_x3": 442.30521, "r_y3": 399.0371999999999, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 478.77893, "t": 398.99639999999994, "r": 487.56302, "b": 407.78133999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.77893, "r_y0": 407.78133999999994, "r_x1": 487.56302, "r_y1": 407.78133999999994, "r_x2": 487.56302, "r_y2": 398.99639999999994, "r_x3": 478.77893, "r_y3": 398.99639999999994, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 523.97241, "t": 398.6114799999999, "r": 532.75647, "b": 407.39642, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97241, "r_y0": 407.39642, "r_x1": 532.75647, "r_y1": 407.39642, "r_x2": 532.75647, "r_y2": 398.6114799999999, "r_x3": 523.97241, "r_y3": 398.6114799999999, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 385.09399, "t": 357.76030999999995, "r": 391.09879, "b": 367.89072, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09399, "r_y0": 367.89072, "r_x1": 391.09879, "r_y1": 367.89072, "r_x2": 391.09879, "r_y2": 357.76030999999995, "r_x3": 385.09399, "r_y3": 357.76030999999995, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 333.43451, "t": 380.7265, "r": 339.4393, "b": 390.85689999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43451, "r_y0": 390.85689999999994, "r_x1": 339.4393, "r_y1": 390.85689999999994, "r_x2": 339.4393, "r_y2": 380.7265, "r_x3": 333.43451, "r_y3": 380.7265, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 478.07210999999995, "t": 341.0368000000001, "r": 484.0769, "b": 351.16720999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07210999999995, "r_y0": 351.16720999999995, "r_x1": 484.0769, "r_y1": 351.16720999999995, "r_x2": 484.0769, "r_y2": 341.0368000000001, "r_x3": 478.07210999999995, "r_y3": 341.0368000000001, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 23, "label": "picture", "bbox": { "l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT" }, "confidence": 0.5088632702827454, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.10422, "t": 437.68588, "r": 398.4967, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.24872, "t": 449.5455, "r": 351.6412, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.70102, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.90424, "t": 473.32291, "r": 337.90903, "b": 483.45331, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.87621999999993, "t": 437.5936, "r": 465.88101, "b": 447.724, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 11, "label": "table", "bbox": { "l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT" }, "confidence": 0.8056110739707947, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.10422, "t": 437.68588, "r": 398.4967, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.24872, "t": 449.5455, "r": 351.6412, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.70102, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.90424, "t": 473.32291, "r": 337.90903, "b": 483.45331, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.87621999999993, "t": 437.5936, "r": 465.88101, "b": 447.724, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 16, "label": "picture", "bbox": { "l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT" }, "confidence": 0.608779788017273, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.19681, "t": 269.35266, "r": 337.2016, "b": 279.48308999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.0329, "t": 252.67895999999996, "r": 390.03769, "b": 262.80939, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 15, "label": "table", "bbox": { "l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT" }, "confidence": 0.6515864729881287, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.19681, "t": 269.35266, "r": 337.2016, "b": 279.48308999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.0329, "t": 252.67895999999996, "r": 390.03769, "b": 262.80939, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 6, "label": "caption", "bbox": { "l": 308.862, "t": 514.50037, "r": 545.11517, "b": 559.2729, "coord_origin": "TOPLEFT" }, "confidence": 0.9214619398117065, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 523.40692, "r_x1": 345.73361, "r_y1": 523.40692, "r_x2": 345.73361, "r_y2": 514.50037, "r_x3": 308.862, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.17566, "r_y0": 523.40692, "r_x1": 545.11511, "r_y1": 523.40692, "r_x2": 545.11511, "r_y2": 514.50037, "r_x3": 353.17566, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 535.3619100000001, "r_x1": 545.11511, "r_y1": 535.3619100000001, "r_x2": 545.11511, "r_y2": 526.45535, "r_x3": 308.862, "r_y3": 526.45535, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 547.31691, "r_x1": 545.11517, "r_y1": 547.31691, "r_x2": 545.11517, "r_y2": 538.41035, "r_x3": 308.862, "r_y3": 538.41035, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 559.2729, "r_x1": 505.6917700000001, "r_y1": 559.2729, "r_x2": 505.6917700000001, "r_y2": 550.36635, "r_x3": 308.862, "r_y3": 550.36635, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 584.40936, "r": 545.11517, "b": 665.04693, "coord_origin": "TOPLEFT" }, "confidence": 0.9848759770393372, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 593.31592, "r_x1": 545.11493, "r_y1": 593.31592, "r_x2": 545.11493, "r_y2": 584.40936, "r_x3": 320.81699, "r_y3": 584.40936, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2709199999999, "r_x1": 545.11517, "r_y1": 605.2709199999999, "r_x2": 545.11517, "r_y2": 596.36436, "r_x3": 308.862, "r_y3": 596.36436, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.22592, "r_x1": 545.11511, "r_y1": 617.22592, "r_x2": 545.11511, "r_y2": 608.31937, "r_x3": 308.862, "r_y3": 608.31937, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.18092, "r_x1": 545.11505, "r_y1": 629.18092, "r_x2": 545.11505, "r_y2": 620.27437, "r_x3": 308.862, "r_y3": 620.27437, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.13692, "r_x1": 353.6937, "r_y1": 641.13692, "r_x2": 353.6937, "r_y2": 632.23036, "r_x3": 308.862, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11209, "r_y0": 641.13692, "r_x1": 374.66617, "r_y1": 641.13692, "r_x2": 374.66617, "r_y2": 632.23036, "r_x3": 362.11209, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.35785, "r_y0": 641.13692, "r_x1": 545.11505, "r_y1": 641.13692, "r_x2": 545.11505, "r_y2": 632.23036, "r_x3": 377.35785, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.09192, "r_x1": 545.11517, "r_y1": 653.09192, "r_x2": 545.11517, "r_y2": 644.18536, "r_x3": 308.862, "r_y3": 644.18536, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.04693, "r_x1": 375.55167, "r_y1": 665.04693, "r_x2": 375.55167, "r_y2": 656.14037, "r_x3": 308.862, "r_y3": 656.14037, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.862, "t": 668.38036, "r": 545.11511, "b": 713.151932, "coord_origin": "TOPLEFT" }, "confidence": 0.979152262210846, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 677.28693, "r_x1": 545.11493, "r_y1": 677.28693, "r_x2": 545.11493, "r_y2": 668.38036, "r_x3": 320.81699, "r_y3": 668.38036, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24193, "r_x1": 545.11511, "r_y1": 689.24193, "r_x2": 545.11511, "r_y2": 680.33536, "r_x3": 308.862, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.19693, "r_x1": 545.11511, "r_y1": 701.19693, "r_x2": 545.11511, "r_y2": 692.290359, "r_x3": 308.862, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151932, "r_x1": 545.11499, "r_y1": 713.151932, "r_x2": 545.11499, "r_y2": 704.245361, "r_x3": 308.862, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133366, "r": 300.10229, "b": 743.039928, "coord_origin": "TOPLEFT" }, "confidence": 0.8045893311500549, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 18.340221, "t": 207.82001000000002, "r": 36.339779, "b": 560.00003, "coord_origin": "TOPLEFT" }, "confidence": 0.8773143887519836, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340221, "r_y0": 560.00003, "r_x1": 36.339779, "r_y1": 560.00003, "r_x2": 36.339779, "r_y2": 207.82001000000002, "r_x3": 18.340221, "r_y3": 207.82001000000002, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "11": { "label": "table", "id": 11, "page_no": 0, "cluster": { "id": 11, "label": "table", "bbox": { "l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT" }, "confidence": 0.8056110739707947, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.10422, "t": 437.68588, "r": 398.4967, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.24872, "t": 449.5455, "r": 351.6412, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.70102, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.90424, "t": 473.32291, "r": 337.90903, "b": 483.45331, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.87621999999993, "t": 437.5936, "r": 465.88101, "b": 447.724, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 5, "table_cells": [ { "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false } ] }, "15": { "label": "table", "id": 15, "page_no": 0, "cluster": { "id": 15, "label": "table", "bbox": { "l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT" }, "confidence": 0.6515864729881287, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.19681, "t": 269.35266, "r": 337.2016, "b": 279.48308999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.0329, "t": 252.67895999999996, "r": 390.03769, "b": 262.80939, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 1, "num_cols": 1, "table_cells": [ { "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 8, "page_no": 0, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 96.301003, "t": 107.03412000000003, "r": 498.92708999999996, "b": 119.93133999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.8868067860603333, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.301003, "r_y0": 119.93133999999998, "r_x1": 498.92708999999996, "r_y1": 119.93133999999998, "r_x2": 498.92708999999996, "r_y2": 107.03412000000003, "r_x3": 96.301003, "r_y3": 107.03412000000003, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers." }, { "label": "section_header", "id": 13, "page_no": 0, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 142.47701, "t": 146.68535999999995, "r": 452.75027, "b": 171.32037000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.7586215734481812, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.47701, "r_y0": 157.37334999999996, "r_x1": 452.75027, "r_y1": 157.37334999999996, "r_x2": 452.75027, "r_y2": 146.68535999999995, "r_x3": 142.47701, "r_y3": 146.68535999999995, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.918, "r_y0": 171.32037000000003, "r_x1": 332.30597, "r_y1": 171.32037000000003, "r_x2": 332.30597, "r_y2": 160.63239, "r_x3": 262.918, "r_y3": 160.63239, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research" }, { "label": "key_value_region", "id": 25, "page_no": 0, "cluster": { "id": 25, "label": "key_value_region", "bbox": { "l": 208.123, "t": 175.96123999999998, "r": 378.73257, "b": 184.42553999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.4854728579521179, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.123, "r_y0": 184.42553999999996, "r_x1": 212.73083, "r_y1": 184.42553999999996, "r_x2": 212.73083, "r_y2": 175.96123999999998, "r_x3": 208.123, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.00409000000002, "r_x1": 293.42761, "r_y1": 184.00409000000002, "r_x2": 293.42761, "r_y2": 177.08203000000003, "r_x3": 212.73, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.42798, "r_y0": 184.42553999999996, "r_x1": 298.0358, "r_y1": 184.42553999999996, "r_x2": 298.0358, "r_y2": 175.96123999999998, "r_x3": 293.42798, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03497, "r_y0": 184.00409000000002, "r_x1": 378.73257, "r_y1": 184.00409000000002, "r_x2": 378.73257, "r_y2": 177.08203000000003, "r_x3": 298.03497, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 208.123, "t": 175.96123999999998, "r": 378.73257, "b": 184.42553999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9096331596374512, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.123, "r_y0": 184.42553999999996, "r_x1": 212.73083, "r_y1": 184.42553999999996, "r_x2": 212.73083, "r_y2": 175.96123999999998, "r_x3": 208.123, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.00409000000002, "r_x1": 293.42761, "r_y1": 184.00409000000002, "r_x2": 293.42761, "r_y2": 177.08203000000003, "r_x3": 212.73, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.42798, "r_y0": 184.42553999999996, "r_x1": 298.0358, "r_y1": 184.42553999999996, "r_x2": 298.0358, "r_y2": 175.96123999999998, "r_x3": 293.42798, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03497, "r_y0": 184.00409000000002, "r_x1": 378.73257, "r_y1": 184.00409000000002, "r_x2": 378.73257, "r_y2": 177.08203000000003, "r_x3": 298.03497, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 145.99498, "t": 215.48297000000002, "r": 190.48029, "b": 226.23071000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9258671402931213, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99498, "r_y0": 226.23071000000004, "r_x1": 190.48029, "r_y1": 226.23071000000004, "r_x2": 190.48029, "r_y2": 215.48297000000002, "r_x3": 145.99498, "r_y3": 215.48297000000002, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract" }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.111977, "t": 241.39508, "r": 286.36511, "b": 512.9966400000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9838882088661194, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 249.98284999999998, "r_x1": 286.36493, "r_y1": 249.98284999999998, "r_x2": 286.36493, "r_y2": 241.39508, "r_x3": 62.066978, "r_y3": 241.39508, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 261.93787, "r_x1": 286.36508, "r_y1": 261.93787, "r_x2": 286.36508, "r_y2": 253.3501, "r_x3": 50.111977, "r_y3": 253.3501, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 273.89288, "r_x1": 286.36508, "r_y1": 273.89288, "r_x2": 286.36508, "r_y2": 265.30511, "r_x3": 50.111977, "r_y3": 265.30511, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 285.84888, "r_x1": 286.36505, "r_y1": 285.84888, "r_x2": 286.36505, "r_y2": 277.26111000000003, "r_x3": 50.111977, "r_y3": 277.26111000000003, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 297.80386, "r_x1": 286.36505, "r_y1": 297.80386, "r_x2": 286.36505, "r_y2": 289.21609, "r_x3": 50.111977, "r_y3": 289.21609, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 309.75884999999994, "r_x1": 286.36505, "r_y1": 309.75884999999994, "r_x2": 286.36505, "r_y2": 301.17108, "r_x3": 50.111977, "r_y3": 301.17108, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 321.71384, "r_x1": 286.36508, "r_y1": 321.71384, "r_x2": 286.36508, "r_y2": 313.12607, "r_x3": 50.111977, "r_y3": 313.12607, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 333.66882, "r_x1": 286.36508, "r_y1": 333.66882, "r_x2": 286.36508, "r_y2": 325.08105, "r_x3": 50.111977, "r_y3": 325.08105, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 345.62381, "r_x1": 286.36505, "r_y1": 345.62381, "r_x2": 286.36505, "r_y2": 337.03604, "r_x3": 50.111977, "r_y3": 337.03604, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 357.5798, "r_x1": 286.36508, "r_y1": 357.5798, "r_x2": 286.36508, "r_y2": 348.99203, "r_x3": 50.111977, "r_y3": 348.99203, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 369.53479, "r_x1": 286.36505, "r_y1": 369.53479, "r_x2": 286.36505, "r_y2": 360.94701999999995, "r_x3": 50.111977, "r_y3": 360.94701999999995, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 381.48978, "r_x1": 286.36508, "r_y1": 381.48978, "r_x2": 286.36508, "r_y2": 372.90201, "r_x3": 50.111977, "r_y3": 372.90201, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 393.44476, "r_x1": 286.36505, "r_y1": 393.44476, "r_x2": 286.36505, "r_y2": 384.85699, "r_x3": 50.111977, "r_y3": 384.85699, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 405.39975000000004, "r_x1": 286.36511, "r_y1": 405.39975000000004, "r_x2": 286.36511, "r_y2": 396.81198, "r_x3": 50.111977, "r_y3": 396.81198, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 417.35474, "r_x1": 286.36508, "r_y1": 417.35474, "r_x2": 286.36508, "r_y2": 408.76697, "r_x3": 50.111977, "r_y3": 408.76697, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 429.31073, "r_x1": 286.36505, "r_y1": 429.31073, "r_x2": 286.36505, "r_y2": 420.72296000000006, "r_x3": 50.111977, "r_y3": 420.72296000000006, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 441.26572, "r_x1": 207.23216, "r_y1": 441.26572, "r_x2": 207.23216, "r_y2": 432.67795, "r_x3": 50.111977, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.09639, "r_y0": 441.26572, "r_x1": 286.36508, "r_y1": 441.26572, "r_x2": 286.36508, "r_y2": 432.67795, "r_x3": 214.09639, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 453.2207, "r_x1": 286.36508, "r_y1": 453.2207, "r_x2": 286.36508, "r_y2": 444.63293, "r_x3": 50.111977, "r_y3": 444.63293, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 465.17569, "r_x1": 286.36505, "r_y1": 465.17569, "r_x2": 286.36505, "r_y2": 456.58792000000005, "r_x3": 50.111977, "r_y3": 456.58792000000005, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 477.13068, "r_x1": 286.36505, "r_y1": 477.13068, "r_x2": 286.36505, "r_y2": 468.54291, "r_x3": 50.111977, "r_y3": 468.54291, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 489.08667, "r_x1": 286.36508, "r_y1": 489.08667, "r_x2": 286.36508, "r_y2": 480.4989, "r_x3": 50.111977, "r_y3": 480.4989, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 501.04166, "r_x1": 286.36505, "r_y1": 501.04166, "r_x2": 286.36505, "r_y2": 492.45389, "r_x3": 50.111977, "r_y3": 492.45389, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 512.9966400000001, "r_x1": 276.65152, "r_y1": 512.9966400000001, "r_x2": 276.65152, "r_y2": 504.40887, "r_x3": 50.111977, "r_y3": 504.40887, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables." }, { "label": "section_header", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 50.111977, "t": 539.94276, "r": 126.94804, "b": 550.69049, "coord_origin": "TOPLEFT" }, "confidence": 0.9317677617073059, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 550.69049, "r_x1": 58.121296, "r_y1": 550.69049, "r_x2": 58.121296, "r_y2": 539.94276, "r_x3": 50.111977, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.800385, "r_y0": 550.69049, "r_x1": 126.94804, "r_y1": 550.69049, "r_x2": 126.94804, "r_y2": 539.94276, "r_x3": 68.800385, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Introduction" }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.111977, "t": 560.7832, "r": 286.36508, "b": 713.151779, "coord_origin": "TOPLEFT" }, "confidence": 0.9841895699501038, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 569.68976, "r_x1": 286.36496, "r_y1": 569.68976, "r_x2": 286.36496, "r_y2": 560.7832, "r_x3": 62.066978, "r_y3": 560.7832, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 581.64476, "r_x1": 286.36508, "r_y1": 581.64476, "r_x2": 286.36508, "r_y2": 572.7382, "r_x3": 50.111977, "r_y3": 572.7382, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 593.5997600000001, "r_x1": 286.36505, "r_y1": 593.5997600000001, "r_x2": 286.36505, "r_y2": 584.69321, "r_x3": 50.111977, "r_y3": 584.69321, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 605.55576, "r_x1": 286.36505, "r_y1": 605.55576, "r_x2": 286.36505, "r_y2": 596.6492000000001, "r_x3": 50.111977, "r_y3": 596.6492000000001, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 617.51076, "r_x1": 286.36505, "r_y1": 617.51076, "r_x2": 286.36505, "r_y2": 608.6042, "r_x3": 50.111977, "r_y3": 608.6042, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 629.46576, "r_x1": 286.36505, "r_y1": 629.46576, "r_x2": 286.36505, "r_y2": 620.5592, "r_x3": 50.111977, "r_y3": 620.5592, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 641.42076, "r_x1": 286.36508, "r_y1": 641.42076, "r_x2": 286.36508, "r_y2": 632.51421, "r_x3": 50.111977, "r_y3": 632.51421, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 653.37576, "r_x1": 286.36508, "r_y1": 653.37576, "r_x2": 286.36508, "r_y2": 644.46921, "r_x3": 50.111977, "r_y3": 644.46921, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 665.33077, "r_x1": 286.36502, "r_y1": 665.33077, "r_x2": 286.36502, "r_y2": 656.42421, "r_x3": 50.111977, "r_y3": 656.42421, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 677.28677, "r_x1": 286.36505, "r_y1": 677.28677, "r_x2": 286.36505, "r_y2": 668.3802000000001, "r_x3": 50.111977, "r_y3": 668.3802000000001, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 689.2417800000001, "r_x1": 286.36505, "r_y1": 689.2417800000001, "r_x2": 286.36505, "r_y2": 680.33521, "r_x3": 50.111977, "r_y3": 680.33521, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 701.196777, "r_x1": 286.36505, "r_y1": 701.196777, "r_x2": 286.36505, "r_y2": 692.290207, "r_x3": 50.111977, "r_y3": 692.290207, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 713.151779, "r_x1": 76.403275, "r_y1": 713.151779, "r_x2": 76.403275, "r_y2": 704.245209, "r_x3": 50.111977, "r_y3": 704.245209, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues." }, { "label": "section_header", "id": 14, "page_no": 0, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 315.56702, "t": 218.00684, "r": 408.4407, "b": 226.75482, "coord_origin": "TOPLEFT" }, "confidence": 0.6724023818969727, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 226.75482, "r_x1": 324.01007, "r_y1": 226.75482, "r_x2": 324.01007, "r_y2": 218.00684, "r_x3": 315.56702, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.2316, "r_y0": 226.75482, "r_x1": 408.4407, "r_y1": 226.75482, "r_x2": 408.4407, "r_y2": 218.00684, "r_x3": 328.2316, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a. Picture of a table:" }, { "label": "list_item", "id": 17, "page_no": 0, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 315.56702, "t": 313.69478999999995, "r": 486.40194999999994, "b": 333.2428, "coord_origin": "TOPLEFT" }, "confidence": 0.5549328923225403, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 322.44281, "r_x1": 325.05786, "r_y1": 322.44281, "r_x2": 325.05786, "r_y2": 313.69478999999995, "r_x3": 315.56702, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.80325, "r_y0": 322.44281, "r_x1": 486.40194999999994, "r_y1": 322.44281, "r_x2": 486.40194999999994, "r_y2": 313.69478999999995, "r_x3": 329.80325, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46252, "r_y0": 333.2428, "r_x1": 472.47411999999997, "r_y1": 333.2428, "r_x2": 472.47411999999997, "r_y2": 324.49478, "r_x3": 326.46252, "r_y3": 324.49478, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer" }, { "label": "list_item", "id": 18, "page_no": 0, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 315.56702, "t": 420.1828, "r": 491.1912500000001, "b": 428.93082, "coord_origin": "TOPLEFT" }, "confidence": 0.5501358509063721, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 428.93082, "r_x1": 324.81039, "r_y1": 428.93082, "r_x2": 324.81039, "r_y2": 420.1828, "r_x3": 315.56702, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.4321, "r_y0": 428.93082, "r_x1": 491.1912500000001, "r_y1": 428.93082, "r_x2": 491.1912500000001, "r_y2": 420.1828, "r_x3": 329.4321, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "c. Structure predicted by TableFormer:" }, { "label": "picture", "id": 10, "page_no": 0, "cluster": { "id": 10, "label": "picture", "bbox": { "l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT" }, "confidence": 0.8742761611938477, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.14752, "r_y0": 351.61322, "r_x1": 412.54001, "r_y1": 351.61322, "r_x2": 412.54001, "r_y2": 342.82828, "r_x3": 408.14752, "r_y3": 342.82828, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11011, "r_y0": 350.35712, "r_x1": 360.50259, "r_y1": 350.35712, "r_x2": 360.50259, "r_y2": 341.57217, "r_x3": 356.11011, "r_y3": 341.57217, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.6777, "r_y0": 349.7226299999999, "r_x1": 505.0701900000001, "r_y1": 349.7226299999999, "r_x2": 505.0701900000001, "r_y2": 340.93768, "r_x3": 500.6777, "r_y3": 340.93768, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13382, "r_y0": 360.53284, "r_x1": 360.52631, "r_y1": 360.53284, "r_x2": 360.52631, "r_y2": 351.74789, "r_x3": 356.13382, "r_y3": 351.74789, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.53992, "r_y0": 364.66144, "r_x1": 406.9324, "r_y1": 364.66144, "r_x2": 406.9324, "r_y2": 355.8765, "r_x3": 402.53992, "r_y3": 355.8765, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58178999999996, "r_y0": 361.62512, "r_x1": 452.97427, "r_y1": 361.62512, "r_x2": 452.97427, "r_y2": 352.84018, "r_x3": 448.58178999999996, "r_y3": 352.84018, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65161000000006, "r_y0": 362.49152, "r_x1": 496.0441, "r_y1": 362.49152, "r_x2": 496.0441, "r_y2": 353.70657, "r_x3": 491.65161000000006, "r_y3": 353.70657, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.13843, "r_y0": 362.12463, "r_x1": 539.53088, "r_y1": 362.12463, "r_x2": 539.53088, "r_y2": 353.33969, "r_x3": 535.13843, "r_y3": 353.33969, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.82822, "r_y0": 395.88275, "r_x1": 353.2207, "r_y1": 395.88275, "r_x2": 353.2207, "r_y2": 387.09781, "r_x3": 348.82822, "r_y3": 387.09781, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27151, "r_y0": 384.15723, "r_x1": 393.664, "r_y1": 384.15723, "r_x2": 393.664, "r_y2": 375.37228, "r_x3": 389.27151, "r_y3": 375.37228, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67479999999995, "r_y0": 384.43115, "r_x1": 451.45889000000005, "r_y1": 384.43115, "r_x2": 451.45889000000005, "r_y2": 375.64621, "r_x3": 442.67479999999995, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.4382299999999, "r_y0": 384.31894000000005, "r_x1": 485.90167, "r_y1": 384.31894000000005, "r_x2": 485.90167, "r_y2": 375.534, "r_x3": 477.4382299999999, "r_y3": 375.534, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57263, "r_y0": 384.43115, "r_x1": 531.35669, "r_y1": 384.43115, "r_x2": 531.35669, "r_y2": 375.64621, "r_x3": 522.57263, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.22992, "r_y0": 395.89923, "r_x1": 409.01401, "r_y1": 395.89923, "r_x2": 409.01401, "r_y2": 387.11429, "r_x3": 400.22992, "r_y3": 387.11429, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30792, "r_y0": 395.77475000000004, "r_x1": 451.0920100000001, "r_y1": 395.77475000000004, "r_x2": 451.0920100000001, "r_y2": 386.98981000000003, "r_x3": 442.30792, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.21941999999996, "r_y0": 396.15964, "r_x1": 487.00351000000006, "r_y1": 396.15964, "r_x2": 487.00351000000006, "r_y2": 387.37469, "r_x3": 478.21941999999996, "r_y3": 387.37469, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.2287, "r_y0": 395.77475000000004, "r_x1": 532.01276, "r_y1": 395.77475000000004, "r_x2": 532.01276, "r_y2": 386.98981000000003, "r_x3": 523.2287, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57233, "r_y0": 408.20972, "r_x1": 415.96481, "r_y1": 408.20972, "r_x2": 415.96481, "r_y2": 399.42477, "r_x3": 411.57233, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96393, "r_y0": 408.20972, "r_x1": 420.35641, "r_y1": 408.20972, "r_x2": 420.35641, "r_y2": 399.42477, "r_x3": 415.96393, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30521, "r_y0": 407.82213999999993, "r_x1": 451.08929, "r_y1": 407.82213999999993, "r_x2": 451.08929, "r_y2": 399.0371999999999, "r_x3": 442.30521, "r_y3": 399.0371999999999, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.77893, "r_y0": 407.78133999999994, "r_x1": 487.56302, "r_y1": 407.78133999999994, "r_x2": 487.56302, "r_y2": 398.99639999999994, "r_x3": 478.77893, "r_y3": 398.99639999999994, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97241, "r_y0": 407.39642, "r_x1": 532.75647, "r_y1": 407.39642, "r_x2": 532.75647, "r_y2": 398.6114799999999, "r_x3": 523.97241, "r_y3": 398.6114799999999, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09399, "r_y0": 367.89072, "r_x1": 391.09879, "r_y1": 367.89072, "r_x2": 391.09879, "r_y2": 357.76030999999995, "r_x3": 385.09399, "r_y3": 357.76030999999995, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43451, "r_y0": 390.85689999999994, "r_x1": 339.4393, "r_y1": 390.85689999999994, "r_x2": 339.4393, "r_y2": 380.7265, "r_x3": 333.43451, "r_y3": 380.7265, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07210999999995, "r_y0": 351.16720999999995, "r_x1": 484.0769, "r_y1": 351.16720999999995, "r_x2": 484.0769, "r_y2": 341.0368000000001, "r_x3": 478.07210999999995, "r_y3": 341.0368000000001, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 40, "label": "text", "bbox": { "l": 408.14752, "t": 342.82828, "r": 412.54001, "b": 351.61322, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.14752, "r_y0": 351.61322, "r_x1": 412.54001, "r_y1": 351.61322, "r_x2": 412.54001, "r_y2": 342.82828, "r_x3": 408.14752, "r_y3": 342.82828, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 356.11011, "t": 341.57217, "r": 360.50259, "b": 350.35712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11011, "r_y0": 350.35712, "r_x1": 360.50259, "r_y1": 350.35712, "r_x2": 360.50259, "r_y2": 341.57217, "r_x3": 356.11011, "r_y3": 341.57217, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 500.6777, "t": 340.93768, "r": 505.0701900000001, "b": 349.7226299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.6777, "r_y0": 349.7226299999999, "r_x1": 505.0701900000001, "r_y1": 349.7226299999999, "r_x2": 505.0701900000001, "r_y2": 340.93768, "r_x3": 500.6777, "r_y3": 340.93768, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 356.13382, "t": 351.74789, "r": 360.52631, "b": 360.53284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13382, "r_y0": 360.53284, "r_x1": 360.52631, "r_y1": 360.53284, "r_x2": 360.52631, "r_y2": 351.74789, "r_x3": 356.13382, "r_y3": 351.74789, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 402.53992, "t": 355.8765, "r": 406.9324, "b": 364.66144, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.53992, "r_y0": 364.66144, "r_x1": 406.9324, "r_y1": 364.66144, "r_x2": 406.9324, "r_y2": 355.8765, "r_x3": 402.53992, "r_y3": 355.8765, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 448.58178999999996, "t": 352.84018, "r": 452.97427, "b": 361.62512, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58178999999996, "r_y0": 361.62512, "r_x1": 452.97427, "r_y1": 361.62512, "r_x2": 452.97427, "r_y2": 352.84018, "r_x3": 448.58178999999996, "r_y3": 352.84018, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 491.65161000000006, "t": 353.70657, "r": 496.0441, "b": 362.49152, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65161000000006, "r_y0": 362.49152, "r_x1": 496.0441, "r_y1": 362.49152, "r_x2": 496.0441, "r_y2": 353.70657, "r_x3": 491.65161000000006, "r_y3": 353.70657, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 535.13843, "t": 353.33969, "r": 539.53088, "b": 362.12463, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.13843, "r_y0": 362.12463, "r_x1": 539.53088, "r_y1": 362.12463, "r_x2": 539.53088, "r_y2": 353.33969, "r_x3": 535.13843, "r_y3": 353.33969, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 348.82822, "t": 387.09781, "r": 353.2207, "b": 395.88275, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.82822, "r_y0": 395.88275, "r_x1": 353.2207, "r_y1": 395.88275, "r_x2": 353.2207, "r_y2": 387.09781, "r_x3": 348.82822, "r_y3": 387.09781, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 389.27151, "t": 375.37228, "r": 393.664, "b": 384.15723, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27151, "r_y0": 384.15723, "r_x1": 393.664, "r_y1": 384.15723, "r_x2": 393.664, "r_y2": 375.37228, "r_x3": 389.27151, "r_y3": 375.37228, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 442.67479999999995, "t": 375.64621, "r": 451.45889000000005, "b": 384.43115, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67479999999995, "r_y0": 384.43115, "r_x1": 451.45889000000005, "r_y1": 384.43115, "r_x2": 451.45889000000005, "r_y2": 375.64621, "r_x3": 442.67479999999995, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 477.4382299999999, "t": 375.534, "r": 485.90167, "b": 384.31894000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.4382299999999, "r_y0": 384.31894000000005, "r_x1": 485.90167, "r_y1": 384.31894000000005, "r_x2": 485.90167, "r_y2": 375.534, "r_x3": 477.4382299999999, "r_y3": 375.534, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 522.57263, "t": 375.64621, "r": 531.35669, "b": 384.43115, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57263, "r_y0": 384.43115, "r_x1": 531.35669, "r_y1": 384.43115, "r_x2": 531.35669, "r_y2": 375.64621, "r_x3": 522.57263, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 400.22992, "t": 387.11429, "r": 409.01401, "b": 395.89923, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.22992, "r_y0": 395.89923, "r_x1": 409.01401, "r_y1": 395.89923, "r_x2": 409.01401, "r_y2": 387.11429, "r_x3": 400.22992, "r_y3": 387.11429, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 442.30792, "t": 386.98981000000003, "r": 451.0920100000001, "b": 395.77475000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30792, "r_y0": 395.77475000000004, "r_x1": 451.0920100000001, "r_y1": 395.77475000000004, "r_x2": 451.0920100000001, "r_y2": 386.98981000000003, "r_x3": 442.30792, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 478.21941999999996, "t": 387.37469, "r": 487.00351000000006, "b": 396.15964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.21941999999996, "r_y0": 396.15964, "r_x1": 487.00351000000006, "r_y1": 396.15964, "r_x2": 487.00351000000006, "r_y2": 387.37469, "r_x3": 478.21941999999996, "r_y3": 387.37469, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 523.2287, "t": 386.98981000000003, "r": 532.01276, "b": 395.77475000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.2287, "r_y0": 395.77475000000004, "r_x1": 532.01276, "r_y1": 395.77475000000004, "r_x2": 532.01276, "r_y2": 386.98981000000003, "r_x3": 523.2287, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 411.57233, "t": 399.42477, "r": 415.96481, "b": 408.20972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57233, "r_y0": 408.20972, "r_x1": 415.96481, "r_y1": 408.20972, "r_x2": 415.96481, "r_y2": 399.42477, "r_x3": 411.57233, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 415.96393, "t": 399.42477, "r": 420.35641, "b": 408.20972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96393, "r_y0": 408.20972, "r_x1": 420.35641, "r_y1": 408.20972, "r_x2": 420.35641, "r_y2": 399.42477, "r_x3": 415.96393, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 442.30521, "t": 399.0371999999999, "r": 451.08929, "b": 407.82213999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30521, "r_y0": 407.82213999999993, "r_x1": 451.08929, "r_y1": 407.82213999999993, "r_x2": 451.08929, "r_y2": 399.0371999999999, "r_x3": 442.30521, "r_y3": 399.0371999999999, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 478.77893, "t": 398.99639999999994, "r": 487.56302, "b": 407.78133999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.77893, "r_y0": 407.78133999999994, "r_x1": 487.56302, "r_y1": 407.78133999999994, "r_x2": 487.56302, "r_y2": 398.99639999999994, "r_x3": 478.77893, "r_y3": 398.99639999999994, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 523.97241, "t": 398.6114799999999, "r": 532.75647, "b": 407.39642, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97241, "r_y0": 407.39642, "r_x1": 532.75647, "r_y1": 407.39642, "r_x2": 532.75647, "r_y2": 398.6114799999999, "r_x3": 523.97241, "r_y3": 398.6114799999999, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 385.09399, "t": 357.76030999999995, "r": 391.09879, "b": 367.89072, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09399, "r_y0": 367.89072, "r_x1": 391.09879, "r_y1": 367.89072, "r_x2": 391.09879, "r_y2": 357.76030999999995, "r_x3": 385.09399, "r_y3": 357.76030999999995, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 333.43451, "t": 380.7265, "r": 339.4393, "b": 390.85689999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43451, "r_y0": 390.85689999999994, "r_x1": 339.4393, "r_y1": 390.85689999999994, "r_x2": 339.4393, "r_y2": 380.7265, "r_x3": 333.43451, "r_y3": 380.7265, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 478.07210999999995, "t": 341.0368000000001, "r": 484.0769, "b": 351.16720999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07210999999995, "r_y0": 351.16720999999995, "r_x1": 484.0769, "r_y1": 351.16720999999995, "r_x2": 484.0769, "r_y2": 341.0368000000001, "r_x3": 478.07210999999995, "r_y3": 341.0368000000001, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 23, "page_no": 0, "cluster": { "id": 23, "label": "picture", "bbox": { "l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT" }, "confidence": 0.5088632702827454, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.10422, "t": 437.68588, "r": 398.4967, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.24872, "t": 449.5455, "r": 351.6412, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.70102, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.90424, "t": 473.32291, "r": 337.90903, "b": 483.45331, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.87621999999993, "t": 437.5936, "r": 465.88101, "b": 447.724, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 0, "cluster": { "id": 11, "label": "table", "bbox": { "l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT" }, "confidence": 0.8056110739707947, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.10422, "t": 437.68588, "r": 398.4967, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.24872, "t": 449.5455, "r": 351.6412, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.70102, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.90424, "t": 473.32291, "r": 337.90903, "b": 483.45331, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.87621999999993, "t": 437.5936, "r": 465.88101, "b": 447.724, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 5, "table_cells": [ { "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "picture", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "picture", "bbox": { "l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT" }, "confidence": 0.608779788017273, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.19681, "t": 269.35266, "r": 337.2016, "b": 279.48308999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.0329, "t": 252.67895999999996, "r": 390.03769, "b": 262.80939, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 15, "page_no": 0, "cluster": { "id": 15, "label": "table", "bbox": { "l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT" }, "confidence": 0.6515864729881287, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.19681, "t": 269.35266, "r": 337.2016, "b": 279.48308999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.0329, "t": 252.67895999999996, "r": 390.03769, "b": 262.80939, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 1, "num_cols": 1, "table_cells": [ { "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 308.862, "t": 514.50037, "r": 545.11517, "b": 559.2729, "coord_origin": "TOPLEFT" }, "confidence": 0.9214619398117065, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 523.40692, "r_x1": 345.73361, "r_y1": 523.40692, "r_x2": 345.73361, "r_y2": 514.50037, "r_x3": 308.862, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.17566, "r_y0": 523.40692, "r_x1": 545.11511, "r_y1": 523.40692, "r_x2": 545.11511, "r_y2": 514.50037, "r_x3": 353.17566, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 535.3619100000001, "r_x1": 545.11511, "r_y1": 535.3619100000001, "r_x2": 545.11511, "r_y2": 526.45535, "r_x3": 308.862, "r_y3": 526.45535, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 547.31691, "r_x1": 545.11517, "r_y1": 547.31691, "r_x2": 545.11517, "r_y2": 538.41035, "r_x3": 308.862, "r_y3": 538.41035, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 559.2729, "r_x1": 505.6917700000001, "r_y1": 559.2729, "r_x2": 505.6917700000001, "r_y2": 550.36635, "r_x3": 308.862, "r_y3": 550.36635, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'." }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 584.40936, "r": 545.11517, "b": 665.04693, "coord_origin": "TOPLEFT" }, "confidence": 0.9848759770393372, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 593.31592, "r_x1": 545.11493, "r_y1": 593.31592, "r_x2": 545.11493, "r_y2": 584.40936, "r_x3": 320.81699, "r_y3": 584.40936, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2709199999999, "r_x1": 545.11517, "r_y1": 605.2709199999999, "r_x2": 545.11517, "r_y2": 596.36436, "r_x3": 308.862, "r_y3": 596.36436, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.22592, "r_x1": 545.11511, "r_y1": 617.22592, "r_x2": 545.11511, "r_y2": 608.31937, "r_x3": 308.862, "r_y3": 608.31937, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.18092, "r_x1": 545.11505, "r_y1": 629.18092, "r_x2": 545.11505, "r_y2": 620.27437, "r_x3": 308.862, "r_y3": 620.27437, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.13692, "r_x1": 353.6937, "r_y1": 641.13692, "r_x2": 353.6937, "r_y2": 632.23036, "r_x3": 308.862, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11209, "r_y0": 641.13692, "r_x1": 374.66617, "r_y1": 641.13692, "r_x2": 374.66617, "r_y2": 632.23036, "r_x3": 362.11209, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.35785, "r_y0": 641.13692, "r_x1": 545.11505, "r_y1": 641.13692, "r_x2": 545.11505, "r_y2": 632.23036, "r_x3": 377.35785, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.09192, "r_x1": 545.11517, "r_y1": 653.09192, "r_x2": 545.11517, "r_y2": 644.18536, "r_x3": 308.862, "r_y3": 644.18536, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.04693, "r_x1": 375.55167, "r_y1": 665.04693, "r_x2": 375.55167, "r_y2": 656.14037, "r_x3": 308.862, "r_y3": 656.14037, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document." }, { "label": "text", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.862, "t": 668.38036, "r": 545.11511, "b": 713.151932, "coord_origin": "TOPLEFT" }, "confidence": 0.979152262210846, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 677.28693, "r_x1": 545.11493, "r_y1": 677.28693, "r_x2": 545.11493, "r_y2": 668.38036, "r_x3": 320.81699, "r_y3": 668.38036, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24193, "r_x1": 545.11511, "r_y1": 689.24193, "r_x2": 545.11511, "r_y2": 680.33536, "r_x3": 308.862, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.19693, "r_x1": 545.11511, "r_y1": 701.19693, "r_x2": 545.11511, "r_y2": 692.290359, "r_x3": 308.862, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151932, "r_x1": 545.11499, "r_y1": 713.151932, "r_x2": 545.11499, "r_y2": 704.245361, "r_x3": 308.862, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be" }, { "label": "page_footer", "id": 12, "page_no": 0, "cluster": { "id": 12, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133366, "r": 300.10229, "b": 743.039928, "coord_origin": "TOPLEFT" }, "confidence": 0.8045893311500549, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1" }, { "label": "page_header", "id": 9, "page_no": 0, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 18.340221, "t": 207.82001000000002, "r": 36.339779, "b": 560.00003, "coord_origin": "TOPLEFT" }, "confidence": 0.8773143887519836, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340221, "r_y0": 560.00003, "r_x1": 36.339779, "r_y1": 560.00003, "r_x2": 36.339779, "r_y2": 207.82001000000002, "r_x3": 18.340221, "r_y3": 207.82001000000002, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022" } ], "body": [ { "label": "section_header", "id": 8, "page_no": 0, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 96.301003, "t": 107.03412000000003, "r": 498.92708999999996, "b": 119.93133999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.8868067860603333, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.301003, "r_y0": 119.93133999999998, "r_x1": 498.92708999999996, "r_y1": 119.93133999999998, "r_x2": 498.92708999999996, "r_y2": 107.03412000000003, "r_x3": 96.301003, "r_y3": 107.03412000000003, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers." }, { "label": "section_header", "id": 13, "page_no": 0, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 142.47701, "t": 146.68535999999995, "r": 452.75027, "b": 171.32037000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.7586215734481812, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.47701, "r_y0": 157.37334999999996, "r_x1": 452.75027, "r_y1": 157.37334999999996, "r_x2": 452.75027, "r_y2": 146.68535999999995, "r_x3": 142.47701, "r_y3": 146.68535999999995, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.918, "r_y0": 171.32037000000003, "r_x1": 332.30597, "r_y1": 171.32037000000003, "r_x2": 332.30597, "r_y2": 160.63239, "r_x3": 262.918, "r_y3": 160.63239, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research" }, { "label": "key_value_region", "id": 25, "page_no": 0, "cluster": { "id": 25, "label": "key_value_region", "bbox": { "l": 208.123, "t": 175.96123999999998, "r": 378.73257, "b": 184.42553999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.4854728579521179, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.123, "r_y0": 184.42553999999996, "r_x1": 212.73083, "r_y1": 184.42553999999996, "r_x2": 212.73083, "r_y2": 175.96123999999998, "r_x3": 208.123, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.00409000000002, "r_x1": 293.42761, "r_y1": 184.00409000000002, "r_x2": 293.42761, "r_y2": 177.08203000000003, "r_x3": 212.73, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.42798, "r_y0": 184.42553999999996, "r_x1": 298.0358, "r_y1": 184.42553999999996, "r_x2": 298.0358, "r_y2": 175.96123999999998, "r_x3": 293.42798, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03497, "r_y0": 184.00409000000002, "r_x1": 378.73257, "r_y1": 184.00409000000002, "r_x2": 378.73257, "r_y2": 177.08203000000003, "r_x3": 298.03497, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 208.123, "t": 175.96123999999998, "r": 378.73257, "b": 184.42553999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9096331596374512, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.123, "r_y0": 184.42553999999996, "r_x1": 212.73083, "r_y1": 184.42553999999996, "r_x2": 212.73083, "r_y2": 175.96123999999998, "r_x3": 208.123, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.00409000000002, "r_x1": 293.42761, "r_y1": 184.00409000000002, "r_x2": 293.42761, "r_y2": 177.08203000000003, "r_x3": 212.73, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.42798, "r_y0": 184.42553999999996, "r_x1": 298.0358, "r_y1": 184.42553999999996, "r_x2": 298.0358, "r_y2": 175.96123999999998, "r_x3": 293.42798, "r_y3": 175.96123999999998, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03497, "r_y0": 184.00409000000002, "r_x1": 378.73257, "r_y1": 184.00409000000002, "r_x2": 378.73257, "r_y2": 177.08203000000003, "r_x3": 298.03497, "r_y3": 177.08203000000003, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 145.99498, "t": 215.48297000000002, "r": 190.48029, "b": 226.23071000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9258671402931213, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99498, "r_y0": 226.23071000000004, "r_x1": 190.48029, "r_y1": 226.23071000000004, "r_x2": 190.48029, "r_y2": 215.48297000000002, "r_x3": 145.99498, "r_y3": 215.48297000000002, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract" }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.111977, "t": 241.39508, "r": 286.36511, "b": 512.9966400000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9838882088661194, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 249.98284999999998, "r_x1": 286.36493, "r_y1": 249.98284999999998, "r_x2": 286.36493, "r_y2": 241.39508, "r_x3": 62.066978, "r_y3": 241.39508, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 261.93787, "r_x1": 286.36508, "r_y1": 261.93787, "r_x2": 286.36508, "r_y2": 253.3501, "r_x3": 50.111977, "r_y3": 253.3501, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 273.89288, "r_x1": 286.36508, "r_y1": 273.89288, "r_x2": 286.36508, "r_y2": 265.30511, "r_x3": 50.111977, "r_y3": 265.30511, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 285.84888, "r_x1": 286.36505, "r_y1": 285.84888, "r_x2": 286.36505, "r_y2": 277.26111000000003, "r_x3": 50.111977, "r_y3": 277.26111000000003, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 297.80386, "r_x1": 286.36505, "r_y1": 297.80386, "r_x2": 286.36505, "r_y2": 289.21609, "r_x3": 50.111977, "r_y3": 289.21609, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 309.75884999999994, "r_x1": 286.36505, "r_y1": 309.75884999999994, "r_x2": 286.36505, "r_y2": 301.17108, "r_x3": 50.111977, "r_y3": 301.17108, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 321.71384, "r_x1": 286.36508, "r_y1": 321.71384, "r_x2": 286.36508, "r_y2": 313.12607, "r_x3": 50.111977, "r_y3": 313.12607, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 333.66882, "r_x1": 286.36508, "r_y1": 333.66882, "r_x2": 286.36508, "r_y2": 325.08105, "r_x3": 50.111977, "r_y3": 325.08105, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 345.62381, "r_x1": 286.36505, "r_y1": 345.62381, "r_x2": 286.36505, "r_y2": 337.03604, "r_x3": 50.111977, "r_y3": 337.03604, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 357.5798, "r_x1": 286.36508, "r_y1": 357.5798, "r_x2": 286.36508, "r_y2": 348.99203, "r_x3": 50.111977, "r_y3": 348.99203, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 369.53479, "r_x1": 286.36505, "r_y1": 369.53479, "r_x2": 286.36505, "r_y2": 360.94701999999995, "r_x3": 50.111977, "r_y3": 360.94701999999995, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 381.48978, "r_x1": 286.36508, "r_y1": 381.48978, "r_x2": 286.36508, "r_y2": 372.90201, "r_x3": 50.111977, "r_y3": 372.90201, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 393.44476, "r_x1": 286.36505, "r_y1": 393.44476, "r_x2": 286.36505, "r_y2": 384.85699, "r_x3": 50.111977, "r_y3": 384.85699, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 405.39975000000004, "r_x1": 286.36511, "r_y1": 405.39975000000004, "r_x2": 286.36511, "r_y2": 396.81198, "r_x3": 50.111977, "r_y3": 396.81198, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 417.35474, "r_x1": 286.36508, "r_y1": 417.35474, "r_x2": 286.36508, "r_y2": 408.76697, "r_x3": 50.111977, "r_y3": 408.76697, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 429.31073, "r_x1": 286.36505, "r_y1": 429.31073, "r_x2": 286.36505, "r_y2": 420.72296000000006, "r_x3": 50.111977, "r_y3": 420.72296000000006, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 441.26572, "r_x1": 207.23216, "r_y1": 441.26572, "r_x2": 207.23216, "r_y2": 432.67795, "r_x3": 50.111977, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.09639, "r_y0": 441.26572, "r_x1": 286.36508, "r_y1": 441.26572, "r_x2": 286.36508, "r_y2": 432.67795, "r_x3": 214.09639, "r_y3": 432.67795, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 453.2207, "r_x1": 286.36508, "r_y1": 453.2207, "r_x2": 286.36508, "r_y2": 444.63293, "r_x3": 50.111977, "r_y3": 444.63293, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 465.17569, "r_x1": 286.36505, "r_y1": 465.17569, "r_x2": 286.36505, "r_y2": 456.58792000000005, "r_x3": 50.111977, "r_y3": 456.58792000000005, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 477.13068, "r_x1": 286.36505, "r_y1": 477.13068, "r_x2": 286.36505, "r_y2": 468.54291, "r_x3": 50.111977, "r_y3": 468.54291, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 489.08667, "r_x1": 286.36508, "r_y1": 489.08667, "r_x2": 286.36508, "r_y2": 480.4989, "r_x3": 50.111977, "r_y3": 480.4989, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 501.04166, "r_x1": 286.36505, "r_y1": 501.04166, "r_x2": 286.36505, "r_y2": 492.45389, "r_x3": 50.111977, "r_y3": 492.45389, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 512.9966400000001, "r_x1": 276.65152, "r_y1": 512.9966400000001, "r_x2": 276.65152, "r_y2": 504.40887, "r_x3": 50.111977, "r_y3": 504.40887, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables." }, { "label": "section_header", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 50.111977, "t": 539.94276, "r": 126.94804, "b": 550.69049, "coord_origin": "TOPLEFT" }, "confidence": 0.9317677617073059, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 550.69049, "r_x1": 58.121296, "r_y1": 550.69049, "r_x2": 58.121296, "r_y2": 539.94276, "r_x3": 50.111977, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.800385, "r_y0": 550.69049, "r_x1": 126.94804, "r_y1": 550.69049, "r_x2": 126.94804, "r_y2": 539.94276, "r_x3": 68.800385, "r_y3": 539.94276, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Introduction" }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.111977, "t": 560.7832, "r": 286.36508, "b": 713.151779, "coord_origin": "TOPLEFT" }, "confidence": 0.9841895699501038, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066978, "r_y0": 569.68976, "r_x1": 286.36496, "r_y1": 569.68976, "r_x2": 286.36496, "r_y2": 560.7832, "r_x3": 62.066978, "r_y3": 560.7832, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 581.64476, "r_x1": 286.36508, "r_y1": 581.64476, "r_x2": 286.36508, "r_y2": 572.7382, "r_x3": 50.111977, "r_y3": 572.7382, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 593.5997600000001, "r_x1": 286.36505, "r_y1": 593.5997600000001, "r_x2": 286.36505, "r_y2": 584.69321, "r_x3": 50.111977, "r_y3": 584.69321, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 605.55576, "r_x1": 286.36505, "r_y1": 605.55576, "r_x2": 286.36505, "r_y2": 596.6492000000001, "r_x3": 50.111977, "r_y3": 596.6492000000001, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 617.51076, "r_x1": 286.36505, "r_y1": 617.51076, "r_x2": 286.36505, "r_y2": 608.6042, "r_x3": 50.111977, "r_y3": 608.6042, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 629.46576, "r_x1": 286.36505, "r_y1": 629.46576, "r_x2": 286.36505, "r_y2": 620.5592, "r_x3": 50.111977, "r_y3": 620.5592, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 641.42076, "r_x1": 286.36508, "r_y1": 641.42076, "r_x2": 286.36508, "r_y2": 632.51421, "r_x3": 50.111977, "r_y3": 632.51421, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 653.37576, "r_x1": 286.36508, "r_y1": 653.37576, "r_x2": 286.36508, "r_y2": 644.46921, "r_x3": 50.111977, "r_y3": 644.46921, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 665.33077, "r_x1": 286.36502, "r_y1": 665.33077, "r_x2": 286.36502, "r_y2": 656.42421, "r_x3": 50.111977, "r_y3": 656.42421, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 677.28677, "r_x1": 286.36505, "r_y1": 677.28677, "r_x2": 286.36505, "r_y2": 668.3802000000001, "r_x3": 50.111977, "r_y3": 668.3802000000001, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 689.2417800000001, "r_x1": 286.36505, "r_y1": 689.2417800000001, "r_x2": 286.36505, "r_y2": 680.33521, "r_x3": 50.111977, "r_y3": 680.33521, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 701.196777, "r_x1": 286.36505, "r_y1": 701.196777, "r_x2": 286.36505, "r_y2": 692.290207, "r_x3": 50.111977, "r_y3": 692.290207, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111977, "r_y0": 713.151779, "r_x1": 76.403275, "r_y1": 713.151779, "r_x2": 76.403275, "r_y2": 704.245209, "r_x3": 50.111977, "r_y3": 704.245209, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues." }, { "label": "section_header", "id": 14, "page_no": 0, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 315.56702, "t": 218.00684, "r": 408.4407, "b": 226.75482, "coord_origin": "TOPLEFT" }, "confidence": 0.6724023818969727, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 226.75482, "r_x1": 324.01007, "r_y1": 226.75482, "r_x2": 324.01007, "r_y2": 218.00684, "r_x3": 315.56702, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.2316, "r_y0": 226.75482, "r_x1": 408.4407, "r_y1": 226.75482, "r_x2": 408.4407, "r_y2": 218.00684, "r_x3": 328.2316, "r_y3": 218.00684, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a. Picture of a table:" }, { "label": "list_item", "id": 17, "page_no": 0, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 315.56702, "t": 313.69478999999995, "r": 486.40194999999994, "b": 333.2428, "coord_origin": "TOPLEFT" }, "confidence": 0.5549328923225403, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 322.44281, "r_x1": 325.05786, "r_y1": 322.44281, "r_x2": 325.05786, "r_y2": 313.69478999999995, "r_x3": 315.56702, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.80325, "r_y0": 322.44281, "r_x1": 486.40194999999994, "r_y1": 322.44281, "r_x2": 486.40194999999994, "r_y2": 313.69478999999995, "r_x3": 329.80325, "r_y3": 313.69478999999995, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46252, "r_y0": 333.2428, "r_x1": 472.47411999999997, "r_y1": 333.2428, "r_x2": 472.47411999999997, "r_y2": 324.49478, "r_x3": 326.46252, "r_y3": 324.49478, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer" }, { "label": "list_item", "id": 18, "page_no": 0, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 315.56702, "t": 420.1828, "r": 491.1912500000001, "b": 428.93082, "coord_origin": "TOPLEFT" }, "confidence": 0.5501358509063721, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.56702, "r_y0": 428.93082, "r_x1": 324.81039, "r_y1": 428.93082, "r_x2": 324.81039, "r_y2": 420.1828, "r_x3": 315.56702, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.4321, "r_y0": 428.93082, "r_x1": 491.1912500000001, "r_y1": 428.93082, "r_x2": 491.1912500000001, "r_y2": 420.1828, "r_x3": 329.4321, "r_y3": 420.1828, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "c. Structure predicted by TableFormer:" }, { "label": "picture", "id": 10, "page_no": 0, "cluster": { "id": 10, "label": "picture", "bbox": { "l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT" }, "confidence": 0.8742761611938477, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.14752, "r_y0": 351.61322, "r_x1": 412.54001, "r_y1": 351.61322, "r_x2": 412.54001, "r_y2": 342.82828, "r_x3": 408.14752, "r_y3": 342.82828, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11011, "r_y0": 350.35712, "r_x1": 360.50259, "r_y1": 350.35712, "r_x2": 360.50259, "r_y2": 341.57217, "r_x3": 356.11011, "r_y3": 341.57217, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.6777, "r_y0": 349.7226299999999, "r_x1": 505.0701900000001, "r_y1": 349.7226299999999, "r_x2": 505.0701900000001, "r_y2": 340.93768, "r_x3": 500.6777, "r_y3": 340.93768, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13382, "r_y0": 360.53284, "r_x1": 360.52631, "r_y1": 360.53284, "r_x2": 360.52631, "r_y2": 351.74789, "r_x3": 356.13382, "r_y3": 351.74789, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.53992, "r_y0": 364.66144, "r_x1": 406.9324, "r_y1": 364.66144, "r_x2": 406.9324, "r_y2": 355.8765, "r_x3": 402.53992, "r_y3": 355.8765, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58178999999996, "r_y0": 361.62512, "r_x1": 452.97427, "r_y1": 361.62512, "r_x2": 452.97427, "r_y2": 352.84018, "r_x3": 448.58178999999996, "r_y3": 352.84018, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65161000000006, "r_y0": 362.49152, "r_x1": 496.0441, "r_y1": 362.49152, "r_x2": 496.0441, "r_y2": 353.70657, "r_x3": 491.65161000000006, "r_y3": 353.70657, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.13843, "r_y0": 362.12463, "r_x1": 539.53088, "r_y1": 362.12463, "r_x2": 539.53088, "r_y2": 353.33969, "r_x3": 535.13843, "r_y3": 353.33969, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.82822, "r_y0": 395.88275, "r_x1": 353.2207, "r_y1": 395.88275, "r_x2": 353.2207, "r_y2": 387.09781, "r_x3": 348.82822, "r_y3": 387.09781, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27151, "r_y0": 384.15723, "r_x1": 393.664, "r_y1": 384.15723, "r_x2": 393.664, "r_y2": 375.37228, "r_x3": 389.27151, "r_y3": 375.37228, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67479999999995, "r_y0": 384.43115, "r_x1": 451.45889000000005, "r_y1": 384.43115, "r_x2": 451.45889000000005, "r_y2": 375.64621, "r_x3": 442.67479999999995, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.4382299999999, "r_y0": 384.31894000000005, "r_x1": 485.90167, "r_y1": 384.31894000000005, "r_x2": 485.90167, "r_y2": 375.534, "r_x3": 477.4382299999999, "r_y3": 375.534, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57263, "r_y0": 384.43115, "r_x1": 531.35669, "r_y1": 384.43115, "r_x2": 531.35669, "r_y2": 375.64621, "r_x3": 522.57263, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.22992, "r_y0": 395.89923, "r_x1": 409.01401, "r_y1": 395.89923, "r_x2": 409.01401, "r_y2": 387.11429, "r_x3": 400.22992, "r_y3": 387.11429, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30792, "r_y0": 395.77475000000004, "r_x1": 451.0920100000001, "r_y1": 395.77475000000004, "r_x2": 451.0920100000001, "r_y2": 386.98981000000003, "r_x3": 442.30792, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.21941999999996, "r_y0": 396.15964, "r_x1": 487.00351000000006, "r_y1": 396.15964, "r_x2": 487.00351000000006, "r_y2": 387.37469, "r_x3": 478.21941999999996, "r_y3": 387.37469, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.2287, "r_y0": 395.77475000000004, "r_x1": 532.01276, "r_y1": 395.77475000000004, "r_x2": 532.01276, "r_y2": 386.98981000000003, "r_x3": 523.2287, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57233, "r_y0": 408.20972, "r_x1": 415.96481, "r_y1": 408.20972, "r_x2": 415.96481, "r_y2": 399.42477, "r_x3": 411.57233, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96393, "r_y0": 408.20972, "r_x1": 420.35641, "r_y1": 408.20972, "r_x2": 420.35641, "r_y2": 399.42477, "r_x3": 415.96393, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30521, "r_y0": 407.82213999999993, "r_x1": 451.08929, "r_y1": 407.82213999999993, "r_x2": 451.08929, "r_y2": 399.0371999999999, "r_x3": 442.30521, "r_y3": 399.0371999999999, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.77893, "r_y0": 407.78133999999994, "r_x1": 487.56302, "r_y1": 407.78133999999994, "r_x2": 487.56302, "r_y2": 398.99639999999994, "r_x3": 478.77893, "r_y3": 398.99639999999994, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97241, "r_y0": 407.39642, "r_x1": 532.75647, "r_y1": 407.39642, "r_x2": 532.75647, "r_y2": 398.6114799999999, "r_x3": 523.97241, "r_y3": 398.6114799999999, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09399, "r_y0": 367.89072, "r_x1": 391.09879, "r_y1": 367.89072, "r_x2": 391.09879, "r_y2": 357.76030999999995, "r_x3": 385.09399, "r_y3": 357.76030999999995, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43451, "r_y0": 390.85689999999994, "r_x1": 339.4393, "r_y1": 390.85689999999994, "r_x2": 339.4393, "r_y2": 380.7265, "r_x3": 333.43451, "r_y3": 380.7265, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07210999999995, "r_y0": 351.16720999999995, "r_x1": 484.0769, "r_y1": 351.16720999999995, "r_x2": 484.0769, "r_y2": 341.0368000000001, "r_x3": 478.07210999999995, "r_y3": 341.0368000000001, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 40, "label": "text", "bbox": { "l": 408.14752, "t": 342.82828, "r": 412.54001, "b": 351.61322, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.14752, "r_y0": 351.61322, "r_x1": 412.54001, "r_y1": 351.61322, "r_x2": 412.54001, "r_y2": 342.82828, "r_x3": 408.14752, "r_y3": 342.82828, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 356.11011, "t": 341.57217, "r": 360.50259, "b": 350.35712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11011, "r_y0": 350.35712, "r_x1": 360.50259, "r_y1": 350.35712, "r_x2": 360.50259, "r_y2": 341.57217, "r_x3": 356.11011, "r_y3": 341.57217, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 500.6777, "t": 340.93768, "r": 505.0701900000001, "b": 349.7226299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.6777, "r_y0": 349.7226299999999, "r_x1": 505.0701900000001, "r_y1": 349.7226299999999, "r_x2": 505.0701900000001, "r_y2": 340.93768, "r_x3": 500.6777, "r_y3": 340.93768, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 356.13382, "t": 351.74789, "r": 360.52631, "b": 360.53284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13382, "r_y0": 360.53284, "r_x1": 360.52631, "r_y1": 360.53284, "r_x2": 360.52631, "r_y2": 351.74789, "r_x3": 356.13382, "r_y3": 351.74789, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 402.53992, "t": 355.8765, "r": 406.9324, "b": 364.66144, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.53992, "r_y0": 364.66144, "r_x1": 406.9324, "r_y1": 364.66144, "r_x2": 406.9324, "r_y2": 355.8765, "r_x3": 402.53992, "r_y3": 355.8765, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 448.58178999999996, "t": 352.84018, "r": 452.97427, "b": 361.62512, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58178999999996, "r_y0": 361.62512, "r_x1": 452.97427, "r_y1": 361.62512, "r_x2": 452.97427, "r_y2": 352.84018, "r_x3": 448.58178999999996, "r_y3": 352.84018, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 491.65161000000006, "t": 353.70657, "r": 496.0441, "b": 362.49152, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65161000000006, "r_y0": 362.49152, "r_x1": 496.0441, "r_y1": 362.49152, "r_x2": 496.0441, "r_y2": 353.70657, "r_x3": 491.65161000000006, "r_y3": 353.70657, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 535.13843, "t": 353.33969, "r": 539.53088, "b": 362.12463, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.13843, "r_y0": 362.12463, "r_x1": 539.53088, "r_y1": 362.12463, "r_x2": 539.53088, "r_y2": 353.33969, "r_x3": 535.13843, "r_y3": 353.33969, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 348.82822, "t": 387.09781, "r": 353.2207, "b": 395.88275, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.82822, "r_y0": 395.88275, "r_x1": 353.2207, "r_y1": 395.88275, "r_x2": 353.2207, "r_y2": 387.09781, "r_x3": 348.82822, "r_y3": 387.09781, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 389.27151, "t": 375.37228, "r": 393.664, "b": 384.15723, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27151, "r_y0": 384.15723, "r_x1": 393.664, "r_y1": 384.15723, "r_x2": 393.664, "r_y2": 375.37228, "r_x3": 389.27151, "r_y3": 375.37228, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 442.67479999999995, "t": 375.64621, "r": 451.45889000000005, "b": 384.43115, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67479999999995, "r_y0": 384.43115, "r_x1": 451.45889000000005, "r_y1": 384.43115, "r_x2": 451.45889000000005, "r_y2": 375.64621, "r_x3": 442.67479999999995, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 477.4382299999999, "t": 375.534, "r": 485.90167, "b": 384.31894000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.4382299999999, "r_y0": 384.31894000000005, "r_x1": 485.90167, "r_y1": 384.31894000000005, "r_x2": 485.90167, "r_y2": 375.534, "r_x3": 477.4382299999999, "r_y3": 375.534, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 522.57263, "t": 375.64621, "r": 531.35669, "b": 384.43115, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57263, "r_y0": 384.43115, "r_x1": 531.35669, "r_y1": 384.43115, "r_x2": 531.35669, "r_y2": 375.64621, "r_x3": 522.57263, "r_y3": 375.64621, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 400.22992, "t": 387.11429, "r": 409.01401, "b": 395.89923, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.22992, "r_y0": 395.89923, "r_x1": 409.01401, "r_y1": 395.89923, "r_x2": 409.01401, "r_y2": 387.11429, "r_x3": 400.22992, "r_y3": 387.11429, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 442.30792, "t": 386.98981000000003, "r": 451.0920100000001, "b": 395.77475000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30792, "r_y0": 395.77475000000004, "r_x1": 451.0920100000001, "r_y1": 395.77475000000004, "r_x2": 451.0920100000001, "r_y2": 386.98981000000003, "r_x3": 442.30792, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 478.21941999999996, "t": 387.37469, "r": 487.00351000000006, "b": 396.15964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.21941999999996, "r_y0": 396.15964, "r_x1": 487.00351000000006, "r_y1": 396.15964, "r_x2": 487.00351000000006, "r_y2": 387.37469, "r_x3": 478.21941999999996, "r_y3": 387.37469, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 523.2287, "t": 386.98981000000003, "r": 532.01276, "b": 395.77475000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.2287, "r_y0": 395.77475000000004, "r_x1": 532.01276, "r_y1": 395.77475000000004, "r_x2": 532.01276, "r_y2": 386.98981000000003, "r_x3": 523.2287, "r_y3": 386.98981000000003, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 411.57233, "t": 399.42477, "r": 415.96481, "b": 408.20972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57233, "r_y0": 408.20972, "r_x1": 415.96481, "r_y1": 408.20972, "r_x2": 415.96481, "r_y2": 399.42477, "r_x3": 411.57233, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 415.96393, "t": 399.42477, "r": 420.35641, "b": 408.20972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96393, "r_y0": 408.20972, "r_x1": 420.35641, "r_y1": 408.20972, "r_x2": 420.35641, "r_y2": 399.42477, "r_x3": 415.96393, "r_y3": 399.42477, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 442.30521, "t": 399.0371999999999, "r": 451.08929, "b": 407.82213999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.30521, "r_y0": 407.82213999999993, "r_x1": 451.08929, "r_y1": 407.82213999999993, "r_x2": 451.08929, "r_y2": 399.0371999999999, "r_x3": 442.30521, "r_y3": 399.0371999999999, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 478.77893, "t": 398.99639999999994, "r": 487.56302, "b": 407.78133999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.77893, "r_y0": 407.78133999999994, "r_x1": 487.56302, "r_y1": 407.78133999999994, "r_x2": 487.56302, "r_y2": 398.99639999999994, "r_x3": 478.77893, "r_y3": 398.99639999999994, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 523.97241, "t": 398.6114799999999, "r": 532.75647, "b": 407.39642, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97241, "r_y0": 407.39642, "r_x1": 532.75647, "r_y1": 407.39642, "r_x2": 532.75647, "r_y2": 398.6114799999999, "r_x3": 523.97241, "r_y3": 398.6114799999999, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 385.09399, "t": 357.76030999999995, "r": 391.09879, "b": 367.89072, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09399, "r_y0": 367.89072, "r_x1": 391.09879, "r_y1": 367.89072, "r_x2": 391.09879, "r_y2": 357.76030999999995, "r_x3": 385.09399, "r_y3": 357.76030999999995, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 333.43451, "t": 380.7265, "r": 339.4393, "b": 390.85689999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43451, "r_y0": 390.85689999999994, "r_x1": 339.4393, "r_y1": 390.85689999999994, "r_x2": 339.4393, "r_y2": 380.7265, "r_x3": 333.43451, "r_y3": 380.7265, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 478.07210999999995, "t": 341.0368000000001, "r": 484.0769, "b": 351.16720999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07210999999995, "r_y0": 351.16720999999995, "r_x1": 484.0769, "r_y1": 351.16720999999995, "r_x2": 484.0769, "r_y2": 341.0368000000001, "r_x3": 478.07210999999995, "r_y3": 341.0368000000001, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 23, "page_no": 0, "cluster": { "id": 23, "label": "picture", "bbox": { "l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT" }, "confidence": 0.5088632702827454, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.10422, "t": 437.68588, "r": 398.4967, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.24872, "t": 449.5455, "r": 351.6412, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.70102, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.90424, "t": 473.32291, "r": 337.90903, "b": 483.45331, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.87621999999993, "t": 437.5936, "r": 465.88101, "b": 447.724, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 0, "cluster": { "id": 11, "label": "table", "bbox": { "l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT" }, "confidence": 0.8056110739707947, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 446.47083, "r_x1": 351.6412, "r_y1": 446.47083, "r_x2": 351.6412, "r_y2": 437.68588, "r_x3": 347.24872, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88071, "r_y0": 446.47083, "r_x1": 323.27319, "r_y1": 446.47083, "r_x2": 323.27319, "r_y2": 437.68588, "r_x3": 318.88071, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.10422, "t": 437.68588, "r": 398.4967, "b": 446.47083, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 446.47083, "r_x1": 398.4967, "r_y1": 446.47083, "r_x2": 398.4967, "r_y2": 437.68588, "r_x3": 394.10422, "r_y3": 437.68588, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 458.33044, "r_x1": 323.16565, "r_y1": 458.33044, "r_x2": 323.16565, "r_y2": 449.5455, "r_x3": 318.77316, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.24872, "t": 449.5455, "r": 351.6412, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 458.33044, "r_x1": 351.6412, "r_y1": 458.33044, "r_x2": 351.6412, "r_y2": 449.5455, "r_x3": 347.24872, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 458.33044, "r_x1": 398.4967, "r_y1": 458.33044, "r_x2": 398.4967, "r_y2": 449.5455, "r_x3": 394.10422, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 458.33044, "r_x1": 445.3519, "r_y1": 458.33044, "r_x2": 445.3519, "r_y2": 449.5455, "r_x3": 440.95941000000005, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 458.33044, "r_x1": 492.2074, "r_y1": 458.33044, "r_x2": 492.2074, "r_y2": 449.5455, "r_x3": 487.81491, "r_y3": 449.5455, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77316, "r_y0": 482.4892, "r_x1": 323.16565, "r_y1": 482.4892, "r_x2": 323.16565, "r_y2": 473.70425, "r_x3": 318.77316, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 470.62955, "r_x1": 351.6412, "r_y1": 470.62955, "r_x2": 351.6412, "r_y2": 461.8446, "r_x3": 347.24872, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 470.62955, "r_x1": 402.88831, "r_y1": 470.62955, "r_x2": 402.88831, "r_y2": 461.8446, "r_x3": 394.10422, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 470.62955, "r_x1": 449.42285, "r_y1": 470.62955, "r_x2": 449.42285, "r_y2": 461.8446, "r_x3": 440.95941000000005, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 470.62955, "r_x1": 496.599, "r_y1": 470.62955, "r_x2": 496.599, "r_y2": 461.8446, "r_x3": 487.81491, "r_y3": 461.8446, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 482.4892, "r_x1": 356.03281, "r_y1": 482.4892, "r_x2": 356.03281, "r_y2": 473.70425, "r_x3": 347.24872, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 482.4892, "r_x1": 402.88831, "r_y1": 482.4892, "r_x2": 402.88831, "r_y2": 473.70425, "r_x3": 394.10422, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 482.4892, "r_x1": 449.7435, "r_y1": 482.4892, "r_x2": 449.7435, "r_y2": 473.70425, "r_x3": 440.95941000000005, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 482.4892, "r_x1": 496.599, "r_y1": 482.4892, "r_x2": 496.599, "r_y2": 473.70425, "r_x3": 487.81491, "r_y3": 473.70425, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.24872, "r_y0": 493.90964, "r_x1": 356.03281, "r_y1": 493.90964, "r_x2": 356.03281, "r_y2": 485.12469, "r_x3": 347.24872, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.10422, "r_y0": 493.90964, "r_x1": 402.88831, "r_y1": 493.90964, "r_x2": 402.88831, "r_y2": 485.12469, "r_x3": 394.10422, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.95941000000005, "r_y0": 493.90964, "r_x1": 449.7435, "r_y1": 493.90964, "r_x2": 449.7435, "r_y2": 485.12469, "r_x3": 440.95941000000005, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81491, "r_y0": 493.90964, "r_x1": 496.599, "r_y1": 493.90964, "r_x2": 496.599, "r_y2": 485.12469, "r_x3": 487.81491, "r_y3": 485.12469, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.70102, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.70102, "r_y0": 459.25122, "r_x1": 372.70581, "r_y1": 459.25122, "r_x2": 372.70581, "r_y2": 449.12082, "r_x3": 366.70102, "r_y3": 449.12082, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.90424, "t": 473.32291, "r": 337.90903, "b": 483.45331, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.90424, "r_y0": 483.45331, "r_x1": 337.90903, "r_y1": 483.45331, "r_x2": 337.90903, "r_y2": 473.32291, "r_x3": 331.90424, "r_y3": 473.32291, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.87621999999993, "t": 437.5936, "r": 465.88101, "b": 447.724, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.87621999999993, "r_y0": 447.724, "r_x1": 465.88101, "r_y1": 447.724, "r_x2": 465.88101, "r_y2": 437.5936, "r_x3": 459.87621999999993, "r_y3": 437.5936, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 5, "table_cells": [ { "bbox": { "l": 347.24872, "t": 437.68588, "r": 351.6412, "b": 446.47083, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.88071, "t": 437.68588, "r": 323.27319, "b": 446.47083, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77316, "t": 449.5455, "r": 323.16565, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 449.12082, "r": 372.70581, "b": 459.25122, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 449.5455, "r": 398.4967, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 449.5455, "r": 445.3519, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 449.5455, "r": 492.2074, "b": 458.33044, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77316, "t": 473.70425, "r": 323.16565, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 461.8446, "r": 351.6412, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 461.8446, "r": 402.88831, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 461.8446, "r": 449.42285, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 461.8446, "r": 496.599, "b": 470.62955, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 473.70425, "r": 356.03281, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 473.70425, "r": 402.88831, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 473.70425, "r": 449.7435, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 473.70425, "r": 496.599, "b": 482.4892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.24872, "t": 485.12469, "r": 356.03281, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.10422, "t": 485.12469, "r": 402.88831, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.95941000000005, "t": 485.12469, "r": 449.7435, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81491, "t": 485.12469, "r": 496.599, "b": 493.90964, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "picture", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "picture", "bbox": { "l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT" }, "confidence": 0.608779788017273, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.19681, "t": 269.35266, "r": 337.2016, "b": 279.48308999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.0329, "t": 252.67895999999996, "r": 390.03769, "b": 262.80939, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 15, "page_no": 0, "cluster": { "id": 15, "label": "table", "bbox": { "l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT" }, "confidence": 0.6515864729881287, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9457100000001, "r_y0": 245.47748, "r_x1": 457.95050000000003, "r_y1": 245.47748, "r_x2": 457.95050000000003, "r_y2": 235.34704999999997, "r_x3": 451.9457100000001, "r_y3": 235.34704999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.19681, "t": 269.35266, "r": 337.2016, "b": 279.48308999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.19681, "r_y0": 279.48308999999995, "r_x1": 337.2016, "r_y1": 279.48308999999995, "r_x2": 337.2016, "r_y2": 269.35266, "r_x3": 331.19681, "r_y3": 269.35266, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.0329, "t": 252.67895999999996, "r": 390.03769, "b": 262.80939, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0329, "r_y0": 262.80939, "r_x1": 390.03769, "r_y1": 262.80939, "r_x2": 390.03769, "r_y2": 252.67895999999996, "r_x3": 384.0329, "r_y3": 252.67895999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 1, "num_cols": 1, "table_cells": [ { "bbox": { "l": 451.9457100000001, "t": 235.34704999999997, "r": 457.95050000000003, "b": 245.47748, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 308.862, "t": 514.50037, "r": 545.11517, "b": 559.2729, "coord_origin": "TOPLEFT" }, "confidence": 0.9214619398117065, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 523.40692, "r_x1": 345.73361, "r_y1": 523.40692, "r_x2": 345.73361, "r_y2": 514.50037, "r_x3": 308.862, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.17566, "r_y0": 523.40692, "r_x1": 545.11511, "r_y1": 523.40692, "r_x2": 545.11511, "r_y2": 514.50037, "r_x3": 353.17566, "r_y3": 514.50037, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 535.3619100000001, "r_x1": 545.11511, "r_y1": 535.3619100000001, "r_x2": 545.11511, "r_y2": 526.45535, "r_x3": 308.862, "r_y3": 526.45535, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 547.31691, "r_x1": 545.11517, "r_y1": 547.31691, "r_x2": 545.11517, "r_y2": 538.41035, "r_x3": 308.862, "r_y3": 538.41035, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 559.2729, "r_x1": 505.6917700000001, "r_y1": 559.2729, "r_x2": 505.6917700000001, "r_y2": 550.36635, "r_x3": 308.862, "r_y3": 550.36635, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'." }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 584.40936, "r": 545.11517, "b": 665.04693, "coord_origin": "TOPLEFT" }, "confidence": 0.9848759770393372, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 593.31592, "r_x1": 545.11493, "r_y1": 593.31592, "r_x2": 545.11493, "r_y2": 584.40936, "r_x3": 320.81699, "r_y3": 584.40936, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2709199999999, "r_x1": 545.11517, "r_y1": 605.2709199999999, "r_x2": 545.11517, "r_y2": 596.36436, "r_x3": 308.862, "r_y3": 596.36436, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.22592, "r_x1": 545.11511, "r_y1": 617.22592, "r_x2": 545.11511, "r_y2": 608.31937, "r_x3": 308.862, "r_y3": 608.31937, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.18092, "r_x1": 545.11505, "r_y1": 629.18092, "r_x2": 545.11505, "r_y2": 620.27437, "r_x3": 308.862, "r_y3": 620.27437, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.13692, "r_x1": 353.6937, "r_y1": 641.13692, "r_x2": 353.6937, "r_y2": 632.23036, "r_x3": 308.862, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11209, "r_y0": 641.13692, "r_x1": 374.66617, "r_y1": 641.13692, "r_x2": 374.66617, "r_y2": 632.23036, "r_x3": 362.11209, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.35785, "r_y0": 641.13692, "r_x1": 545.11505, "r_y1": 641.13692, "r_x2": 545.11505, "r_y2": 632.23036, "r_x3": 377.35785, "r_y3": 632.23036, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.09192, "r_x1": 545.11517, "r_y1": 653.09192, "r_x2": 545.11517, "r_y2": 644.18536, "r_x3": 308.862, "r_y3": 644.18536, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.04693, "r_x1": 375.55167, "r_y1": 665.04693, "r_x2": 375.55167, "r_y2": 656.14037, "r_x3": 308.862, "r_y3": 656.14037, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document." }, { "label": "text", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.862, "t": 668.38036, "r": 545.11511, "b": 713.151932, "coord_origin": "TOPLEFT" }, "confidence": 0.979152262210846, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 677.28693, "r_x1": 545.11493, "r_y1": 677.28693, "r_x2": 545.11493, "r_y2": 668.38036, "r_x3": 320.81699, "r_y3": 668.38036, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24193, "r_x1": 545.11511, "r_y1": 689.24193, "r_x2": 545.11511, "r_y2": 680.33536, "r_x3": 308.862, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.19693, "r_x1": 545.11511, "r_y1": 701.19693, "r_x2": 545.11511, "r_y2": 692.290359, "r_x3": 308.862, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151932, "r_x1": 545.11499, "r_y1": 713.151932, "r_x2": 545.11499, "r_y2": 704.245361, "r_x3": 308.862, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be" } ], "headers": [ { "label": "page_footer", "id": 12, "page_no": 0, "cluster": { "id": 12, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133366, "r": 300.10229, "b": 743.039928, "coord_origin": "TOPLEFT" }, "confidence": 0.8045893311500549, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1" }, { "label": "page_header", "id": 9, "page_no": 0, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 18.340221, "t": 207.82001000000002, "r": 36.339779, "b": 560.00003, "coord_origin": "TOPLEFT" }, "confidence": 0.8773143887519836, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340221, "r_y0": 560.00003, "r_x1": 36.339779, "r_y1": 560.00003, "r_x2": 36.339779, "r_y2": 207.82001000000002, "r_x3": 18.340221, "r_y3": 207.82001000000002, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022" } ] } }, { "page_no": 1, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36505, "r_y1": 84.11492999999996, "r_x2": 286.36505, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 112.64721999999999, "r_y1": 96.06994999999995, "r_x2": 112.64721999999999, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 108.47797000000003, "r_x1": 286.36496, "r_y1": 108.47797000000003, "r_x2": 286.36496, "r_y2": 99.57141000000001, "r_x3": 62.067001, "r_y3": 99.57141000000001, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.43297999999993, "r_x1": 74.749512, "r_y1": 120.43297999999993, "r_x2": 74.749512, "r_y2": 111.52643, "r_x3": 50.112, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.334793, "r_y0": 120.43297999999993, "r_x1": 286.36514, "r_y1": 120.43297999999993, "r_x2": 286.36514, "r_y2": 111.52643, "r_x3": 81.334793, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 132.38800000000003, "r_x1": 286.36511, "r_y1": 132.38800000000003, "r_x2": 286.36511, "r_y2": 123.48145, "r_x3": 50.112, "r_y3": 123.48145, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 144.34302000000002, "r_x1": 286.36511, "r_y1": 144.34302000000002, "r_x2": 286.36511, "r_y2": 135.43646, "r_x3": 50.112, "r_y3": 135.43646, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 156.29900999999995, "r_x1": 286.36505, "r_y1": 156.29900999999995, "r_x2": 286.36505, "r_y2": 147.39246000000003, "r_x3": 50.112, "r_y3": 147.39246000000003, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 168.25402999999994, "r_x1": 286.36511, "r_y1": 168.25402999999994, "r_x2": 286.36511, "r_y2": 159.34747000000004, "r_x3": 50.112, "r_y3": 159.34747000000004, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.20905000000005, "r_x1": 286.36508, "r_y1": 180.20905000000005, "r_x2": 286.36508, "r_y2": 171.30249000000003, "r_x3": 50.112, "r_y3": 171.30249000000003, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.16405999999995, "r_x1": 286.36511, "r_y1": 192.16405999999995, "r_x2": 286.36511, "r_y2": 183.25751000000002, "r_x3": 50.112, "r_y3": 183.25751000000002, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.11908000000005, "r_x1": 286.36508, "r_y1": 204.11908000000005, "r_x2": 286.36508, "r_y2": 195.21252000000004, "r_x3": 50.112, "r_y3": 195.21252000000004, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.07410000000004, "r_x1": 286.36514, "r_y1": 216.07410000000004, "r_x2": 286.36514, "r_y2": 207.16754000000003, "r_x3": 50.112, "r_y3": 207.16754000000003, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.03008999999997, "r_x1": 278.66397, "r_y1": 228.03008999999997, "r_x2": 278.66397, "r_y2": 219.12354000000005, "r_x3": 50.112, "r_y3": 219.12354000000005, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 240.43811000000005, "r_x1": 286.36493, "r_y1": 240.43811000000005, "r_x2": 286.36493, "r_y2": 231.53156, "r_x3": 62.067001, "r_y3": 231.53156, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 252.39313000000004, "r_x1": 286.36511, "r_y1": 252.39313000000004, "r_x2": 286.36511, "r_y2": 243.48657000000003, "r_x3": 50.112, "r_y3": 243.48657000000003, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.34813999999994, "r_x1": 286.36511, "r_y1": 264.34813999999994, "r_x2": 286.36511, "r_y2": 255.44159000000002, "r_x3": 50.112, "r_y3": 255.44159000000002, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.30316000000005, "r_x1": 286.36502, "r_y1": 276.30316000000005, "r_x2": 286.36502, "r_y2": 267.39661, "r_x3": 50.112, "r_y3": 267.39661, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.25815, "r_x1": 286.36508, "r_y1": 288.25815, "r_x2": 286.36508, "r_y2": 279.35155999999995, "r_x3": 50.112, "r_y3": 279.35155999999995, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.21414, "r_x1": 88.567635, "r_y1": 300.21414, "r_x2": 88.567635, "r_y2": 291.30759, "r_x3": 50.112, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.501602, "r_y0": 300.21414, "r_x1": 286.36505, "r_y1": 300.21414, "r_x2": 286.36505, "r_y2": 291.30759, "r_x3": 95.501602, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.16913, "r_x1": 286.36508, "r_y1": 312.16913, "r_x2": 286.36508, "r_y2": 303.26257, "r_x3": 50.112, "r_y3": 303.26257, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.12411, "r_x1": 286.36511, "r_y1": 324.12411, "r_x2": 286.36511, "r_y2": 315.21756, "r_x3": 50.112, "r_y3": 315.21756, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.0791, "r_x1": 286.36505, "r_y1": 336.0791, "r_x2": 286.36505, "r_y2": 327.17255, "r_x3": 50.112, "r_y3": 327.17255, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.03409, "r_x1": 286.36511, "r_y1": 348.03409, "r_x2": 286.36511, "r_y2": 339.12753, "r_x3": 50.112, "r_y3": 339.12753, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.99008, "r_x1": 286.36508, "r_y1": 359.99008, "r_x2": 286.36508, "r_y2": 351.08353, "r_x3": 50.112, "r_y3": 351.08353, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.94507, "r_x1": 76.951241, "r_y1": 371.94507, "r_x2": 76.951241, "r_y2": 363.03851, "r_x3": 50.112, "r_y3": 363.03851, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 384.35306, "r_x1": 286.36499, "r_y1": 384.35306, "r_x2": 286.36499, "r_y2": 375.4465, "r_x3": 62.067001, "r_y3": 375.4465, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.30804, "r_x1": 120.98594, "r_y1": 396.30804, "r_x2": 120.98594, "r_y2": 387.40149, "r_x3": 50.112, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.901, "r_y0": 396.23830999999996, "r_x1": 179.7314, "r_y1": 396.23830999999996, "r_x2": 179.7314, "r_y2": 387.28192, "r_x3": 123.901, "r_y3": 387.28192, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.646, "r_y0": 396.30804, "r_x1": 286.36658, "r_y1": 396.30804, "r_x2": 286.36658, "r_y2": 387.40149, "r_x3": 182.646, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 408.26302999999996, "r_x1": 181.75778, "r_y1": 408.26302999999996, "r_x2": 181.75778, "r_y2": 399.35648, "r_x3": 50.112, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.104, "r_y0": 408.1933, "r_x1": 240.2034, "r_y1": 408.1933, "r_x2": 240.2034, "r_y2": 399.23690999999997, "r_x3": 184.104, "r_y3": 399.23690999999997, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.20401, "r_y0": 408.26302999999996, "r_x1": 286.36069, "r_y1": 408.26302999999996, "r_x2": 286.36069, "r_y2": 399.35648, "r_x3": 240.20401, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 420.21802, "r_x1": 286.36511, "r_y1": 420.21802, "r_x2": 286.36511, "r_y2": 411.31146, "r_x3": 50.112015, "r_y3": 411.31146, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 432.173, "r_x1": 82.520355, "r_y1": 432.173, "r_x2": 82.520355, "r_y2": 423.26645, "r_x3": 50.112015, "r_y3": 423.26645, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 453.45801, "r_x1": 70.741714, "r_y1": 453.45801, "r_x2": 70.741714, "r_y2": 444.55145, "r_x3": 61.569016, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.034889, "r_y0": 453.45801, "r_x1": 117.10054, "r_y1": 453.45801, "r_x2": 117.10054, "r_y2": 444.55145, "r_x3": 73.034889, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59001, "r_y0": 453.38828, "r_x1": 175.42041, "r_y1": 453.38828, "r_x2": 175.42041, "r_y2": 444.43188, "r_x3": 119.59001, "r_y3": 444.43188, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42102, "r_y0": 453.45801, "r_x1": 286.36453, "r_y1": 453.45801, "r_x2": 286.36453, "r_y2": 444.55145, "r_x3": 175.42102, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 465.41299, "r_x1": 286.3649, "r_y1": 465.41299, "r_x2": 286.3649, "r_y2": 456.50644000000005, "r_x3": 70.037018, "r_y3": 456.50644000000005, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 477.36798, "r_x1": 286.3649, "r_y1": 477.36798, "r_x2": 286.3649, "r_y2": 468.46143, "r_x3": 70.037018, "r_y3": 468.46143, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 489.32297, "r_x1": 99.635902, "r_y1": 489.32297, "r_x2": 99.635902, "r_y2": 480.41641, "r_x3": 70.037018, "r_y3": 480.41641, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 511.05997, "r_x1": 71.619438, "r_y1": 511.05997, "r_x2": 71.619438, "r_y2": 502.15341, "r_x3": 61.569016, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.132042, "r_y0": 511.05997, "r_x1": 196.10396, "r_y1": 511.05997, "r_x2": 196.10396, "r_y2": 502.15341, "r_x3": 74.132042, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31001, "r_y0": 510.99023, "r_x1": 256.14041, "r_y1": 510.99023, "r_x2": 256.14041, "r_y2": 502.03384, "r_x3": 200.31001, "r_y3": 502.03384, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35001, "r_y0": 511.05997, "r_x1": 286.36237, "r_y1": 511.05997, "r_x2": 286.36237, "r_y2": 502.15341, "r_x3": 260.35001, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 523.01495, "r_x1": 286.3649, "r_y1": 523.01495, "r_x2": 286.3649, "r_y2": 514.1084000000001, "r_x3": 70.037003, "r_y3": 514.1084000000001, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 534.97095, "r_x1": 286.36487, "r_y1": 534.97095, "r_x2": 286.36487, "r_y2": 526.06439, "r_x3": 70.037003, "r_y3": 526.06439, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 546.9259500000001, "r_x1": 161.65305, "r_y1": 546.9259500000001, "r_x2": 161.65305, "r_y2": 538.0193899999999, "r_x3": 70.037003, "r_y3": 538.0193899999999, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 568.66295, "r_x1": 71.115913, "r_y1": 568.66295, "r_x2": 71.115913, "r_y2": 559.75639, "r_x3": 61.569, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.502647, "r_y0": 568.66295, "r_x1": 116.71199, "r_y1": 568.66295, "r_x2": 116.71199, "r_y2": 559.75639, "r_x3": 73.502647, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.583, "r_y0": 568.59322, "r_x1": 177.68239, "r_y1": 568.59322, "r_x2": 177.68239, "r_y2": 559.63684, "r_x3": 121.583, "r_y3": 559.63684, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55301, "r_y0": 568.66295, "r_x1": 286.36328, "r_y1": 568.66295, "r_x2": 286.36328, "r_y2": 559.75639, "r_x3": 182.55301, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 580.6179500000001, "r_x1": 286.36493, "r_y1": 580.6179500000001, "r_x2": 286.36493, "r_y2": 571.7114, "r_x3": 70.03701, "r_y3": 571.7114, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 592.57295, "r_x1": 82.400597, "r_y1": 592.57295, "r_x2": 82.400597, "r_y2": 583.6664000000001, "r_x3": 70.03701, "r_y3": 583.6664000000001, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569008000000004, "r_y0": 614.30995, "r_x1": 72.332527, "r_y1": 614.30995, "r_x2": 72.332527, "r_y2": 605.4034, "r_x3": 61.569008000000004, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.023399, "r_y0": 614.30995, "r_x1": 286.36508, "r_y1": 614.30995, "r_x2": 286.36508, "r_y2": 605.4034, "r_x3": 75.023399, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 626.26495, "r_x1": 286.36487, "r_y1": 626.26495, "r_x2": 286.36487, "r_y2": 617.3584, "r_x3": 70.03701, "r_y3": 617.3584, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 638.22095, "r_x1": 198.05641, "r_y1": 638.22095, "r_x2": 198.05641, "r_y2": 629.31439, "r_x3": 70.03701, "r_y3": 629.31439, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067009000000006, "r_y0": 659.50494, "r_x1": 286.36496, "r_y1": 659.50494, "r_x2": 286.36496, "r_y2": 650.59839, "r_x3": 62.067009000000006, "r_y3": 650.59839, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 671.45995, "r_x1": 286.36511, "r_y1": 671.45995, "r_x2": 286.36511, "r_y2": 662.55339, "r_x3": 50.112007, "r_y3": 662.55339, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 683.41496, "r_x1": 286.36511, "r_y1": 683.41496, "r_x2": 286.36511, "r_y2": 674.50839, "r_x3": 50.112007, "r_y3": 674.50839, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 695.369957, "r_x1": 286.36511, "r_y1": 695.369957, "r_x2": 286.36511, "r_y2": 686.46339, "r_x3": 50.112007, "r_y3": 686.46339, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97100100000001, "r_y0": 712.721542, "r_x1": 183.73055, "r_y1": 712.721542, "r_x2": 183.73055, "r_y2": 705.596275, "r_x3": 60.97100100000001, "r_y3": 705.596275, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 545.11511, "r_y1": 84.11492999999996, "r_x2": 545.11511, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11505, "r_y1": 96.06994999999995, "r_x2": 545.11505, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 508.08417000000003, "r_y1": 108.02495999999985, "r_x2": 508.08417000000003, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 132.47968000000003, "r_x1": 315.5831, "r_y1": 132.47968000000003, "r_x2": 315.5831, "r_y2": 121.73193000000003, "r_x3": 308.862, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54456, "r_y0": 132.47968000000003, "r_x1": 498.28021, "r_y1": 132.47968000000003, "r_x2": 498.28021, "r_y2": 121.73193000000003, "r_x3": 324.54456, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 151.12793, "r_x1": 545.11493, "r_y1": 151.12793, "r_x2": 545.11493, "r_y2": 142.22136999999998, "r_x3": 320.81699, "r_y3": 142.22136999999998, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 163.08294999999998, "r_x1": 545.11505, "r_y1": 163.08294999999998, "r_x2": 545.11505, "r_y2": 154.17638999999997, "r_x3": 308.862, "r_y3": 154.17638999999997, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 175.03796, "r_x1": 522.55975, "r_y1": 175.03796, "r_x2": 522.55975, "r_y2": 166.13140999999996, "r_x3": 308.862, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 175.03796, "r_x1": 545.11505, "r_y1": 175.03796, "r_x2": 545.11505, "r_y2": 166.13140999999996, "r_x3": 529.62323, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 186.99298, "r_x1": 545.11517, "r_y1": 186.99298, "r_x2": 545.11517, "r_y2": 178.08642999999995, "r_x3": 308.862, "r_y3": 178.08642999999995, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 198.94799999999998, "r_x1": 545.11511, "r_y1": 198.94799999999998, "r_x2": 545.11511, "r_y2": 190.04143999999997, "r_x3": 308.862, "r_y3": 190.04143999999997, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 210.90301999999997, "r_x1": 346.97891, "r_y1": 210.90301999999997, "r_x2": 346.97891, "r_y2": 201.99645999999996, "r_x3": 308.862, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.86929, "r_y0": 210.90301999999997, "r_x1": 545.11511, "r_y1": 210.90301999999997, "r_x2": 545.11511, "r_y2": 201.99645999999996, "r_x3": 354.86929, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 222.85901, "r_x1": 545.11505, "r_y1": 222.85901, "r_x2": 545.11505, "r_y2": 213.95245, "r_x3": 308.862, "r_y3": 213.95245, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 234.81403, "r_x1": 530.9184, "r_y1": 234.81403, "r_x2": 530.9184, "r_y2": 225.90747, "r_x3": 308.862, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92212, "r_y0": 234.81403, "r_x1": 545.11511, "r_y1": 234.81403, "r_x2": 545.11511, "r_y2": 225.90747, "r_x3": 537.92212, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 246.76904000000002, "r_x1": 545.11517, "r_y1": 246.76904000000002, "r_x2": 545.11517, "r_y2": 237.86248999999998, "r_x3": 308.862, "r_y3": 237.86248999999998, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.72406, "r_x1": 545.11511, "r_y1": 258.72406, "r_x2": 545.11511, "r_y2": 249.8175, "r_x3": 308.862, "r_y3": 249.8175, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.67908, "r_x1": 439.8402699999999, "r_y1": 270.67908, "r_x2": 439.8402699999999, "r_y2": 261.77252, "r_x3": 308.862, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.43999999999994, "r_y0": 270.45989999999995, "r_x1": 452.1889, "r_y1": 270.45989999999995, "r_x2": 452.1889, "r_y2": 261.61310000000003, "r_x3": 444.43999999999994, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89001, "r_y0": 270.45989999999995, "r_x1": 470.83392000000003, "r_y1": 270.45989999999995, "r_x2": 470.83392000000003, "r_y2": 261.61310000000003, "r_x3": 455.89001, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83401, "r_y0": 270.67908, "r_x1": 545.11517, "r_y1": 270.67908, "r_x2": 545.11517, "r_y2": 261.77252, "r_x3": 470.83401, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.63406, "r_x1": 545.11511, "r_y1": 282.63406, "r_x2": 545.11511, "r_y2": 273.72748, "r_x3": 308.862, "r_y3": 273.72748, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.59006, "r_x1": 545.11511, "r_y1": 294.59006, "r_x2": 545.11511, "r_y2": 285.6835, "r_x3": 308.862, "r_y3": 285.6835, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 306.54504, "r_x1": 545.11511, "r_y1": 306.54504, "r_x2": 545.11511, "r_y2": 297.63849, "r_x3": 308.862, "r_y3": 297.63849, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 318.50003000000004, "r_x1": 545.11517, "r_y1": 318.50003000000004, "r_x2": 545.11517, "r_y2": 309.59348, "r_x3": 308.862, "r_y3": 309.59348, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 330.45502, "r_x1": 425.92255, "r_y1": 330.45502, "r_x2": 425.92255, "r_y2": 321.54846, "r_x3": 308.862, "r_y3": 321.54846, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 342.47601, "r_x1": 545.11499, "r_y1": 342.47601, "r_x2": 545.11499, "r_y2": 333.56946, "r_x3": 320.81699, "r_y3": 333.56946, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 354.43100000000004, "r_x1": 545.11499, "r_y1": 354.43100000000004, "r_x2": 545.11499, "r_y2": 345.52444, "r_x3": 308.862, "r_y3": 345.52444, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 366.38599, "r_x1": 545.11517, "r_y1": 366.38599, "r_x2": 545.11517, "r_y2": 357.47943, "r_x3": 308.862, "r_y3": 357.47943, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 378.34198, "r_x1": 545.11511, "r_y1": 378.34198, "r_x2": 545.11511, "r_y2": 369.43542, "r_x3": 308.862, "r_y3": 369.43542, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 390.29697, "r_x1": 545.11505, "r_y1": 390.29697, "r_x2": 545.11505, "r_y2": 381.39041, "r_x3": 308.862, "r_y3": 381.39041, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 402.25195, "r_x1": 545.11505, "r_y1": 402.25195, "r_x2": 545.11505, "r_y2": 393.3453999999999, "r_x3": 308.862, "r_y3": 393.3453999999999, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 414.20694, "r_x1": 545.11517, "r_y1": 414.20694, "r_x2": 545.11517, "r_y2": 405.30038, "r_x3": 308.862, "r_y3": 405.30038, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 426.16193, "r_x1": 545.11523, "r_y1": 426.16193, "r_x2": 545.11523, "r_y2": 417.25537, "r_x3": 308.862, "r_y3": 417.25537, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 438.11792, "r_x1": 545.11511, "r_y1": 438.11792, "r_x2": 545.11511, "r_y2": 429.21136000000007, "r_x3": 308.862, "r_y3": 429.21136000000007, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 450.0729099999999, "r_x1": 401.28503, "r_y1": 450.0729099999999, "r_x2": 401.28503, "r_y2": 441.16635, "r_x3": 308.862, "r_y3": 441.16635, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 462.02417, "r_x1": 423.26236, "r_y1": 462.02417, "r_x2": 423.26236, "r_y2": 453.06778, "r_x3": 320.81699, "r_y3": 453.06778, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.26697, "r_y0": 462.0939, "r_x1": 545.10956, "r_y1": 462.0939, "r_x2": 545.10956, "r_y2": 453.18735, "r_x3": 423.26697, "r_y3": 453.18735, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 474.04889, "r_x1": 545.11511, "r_y1": 474.04889, "r_x2": 545.11511, "r_y2": 465.14233, "r_x3": 308.86197, "r_y3": 465.14233, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 486.00388, "r_x1": 335.7012, "r_y1": 486.00388, "r_x2": 335.7012, "r_y2": 477.09732, "r_x3": 308.86197, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85309, "r_y0": 486.00388, "r_x1": 545.11505, "r_y1": 486.00388, "r_x2": 545.11505, "r_y2": 477.09732, "r_x3": 345.85309, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.95886, "r_x1": 545.11493, "r_y1": 497.95886, "r_x2": 545.11493, "r_y2": 489.05231, "r_x3": 308.86197, "r_y3": 489.05231, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.91385, "r_x1": 545.11499, "r_y1": 509.91385, "r_x2": 545.11499, "r_y2": 501.00729, "r_x3": 308.86197, "r_y3": 501.00729, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.8698400000001, "r_x1": 545.11505, "r_y1": 521.8698400000001, "r_x2": 545.11505, "r_y2": 512.9632899999999, "r_x3": 308.86197, "r_y3": 512.9632899999999, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.82483, "r_x1": 545.11505, "r_y1": 533.82483, "r_x2": 545.11505, "r_y2": 524.91827, "r_x3": 308.86197, "r_y3": 524.91827, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.77983, "r_x1": 420.94119, "r_y1": 545.77983, "r_x2": 420.94119, "r_y2": 536.87328, "r_x3": 308.86197, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59497, "r_y0": 545.56065, "r_x1": 433.5575600000001, "r_y1": 545.56065, "r_x2": 433.5575600000001, "r_y2": 536.1559599999999, "r_x3": 423.59497, "r_y3": 536.1559599999999, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21198, "r_y0": 545.77983, "r_x1": 545.11316, "r_y1": 545.77983, "r_x2": 545.11316, "r_y2": 536.87328, "r_x3": 436.21198, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 557.73483, "r_x1": 545.11511, "r_y1": 557.73483, "r_x2": 545.11511, "r_y2": 548.82828, "r_x3": 308.86197, "r_y3": 548.82828, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 569.68983, "r_x1": 545.11493, "r_y1": 569.68983, "r_x2": 545.11493, "r_y2": 560.78328, "r_x3": 308.86197, "r_y3": 560.78328, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 581.6448399999999, "r_x1": 545.11499, "r_y1": 581.6448399999999, "r_x2": 545.11499, "r_y2": 572.73828, "r_x3": 308.86197, "r_y3": 572.73828, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 593.60083, "r_x1": 545.11505, "r_y1": 593.60083, "r_x2": 545.11505, "r_y2": 584.69427, "r_x3": 308.86197, "r_y3": 584.69427, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 605.55583, "r_x1": 497.07541, "r_y1": 605.55583, "r_x2": 497.07541, "r_y2": 596.6492800000001, "r_x3": 308.86197, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.80496, "r_y0": 605.33665, "r_x1": 509.76755, "r_y1": 605.33665, "r_x2": 509.76755, "r_y2": 595.93196, "r_x3": 499.80496, "r_y3": 595.93196, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.50098, "r_y0": 605.55583, "r_x1": 545.10852, "r_y1": 605.55583, "r_x2": 545.10852, "r_y2": 596.6492800000001, "r_x3": 512.50098, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 617.5108299999999, "r_x1": 545.11511, "r_y1": 617.5108299999999, "r_x2": 545.11511, "r_y2": 608.60428, "r_x3": 308.86197, "r_y3": 608.60428, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.46584, "r_x1": 545.11505, "r_y1": 629.46584, "r_x2": 545.11505, "r_y2": 620.55928, "r_x3": 308.86197, "r_y3": 620.55928, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.42084, "r_x1": 364.78201, "r_y1": 641.42084, "r_x2": 364.78201, "r_y2": 632.51428, "r_x3": 308.86197, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57397, "r_y0": 641.1917, "r_x1": 415.61362, "r_y1": 641.1917, "r_x2": 415.61362, "r_y2": 632.60394, "r_x3": 367.57397, "r_y3": 632.60394, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61298, "r_y0": 641.42084, "r_x1": 545.11688, "r_y1": 641.42084, "r_x2": 545.11688, "r_y2": 632.51428, "r_x3": 415.61298, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.37584, "r_x1": 545.11511, "r_y1": 653.37584, "r_x2": 545.11511, "r_y2": 644.46928, "r_x3": 308.86197, "r_y3": 644.46928, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 665.1027, "r_x1": 373.59894, "r_y1": 665.1027, "r_x2": 373.59894, "r_y2": 656.51494, "r_x3": 308.86197, "r_y3": 656.51494, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.90698, "r_y0": 665.33184, "r_x1": 545.11548, "r_y1": 665.33184, "r_x2": 545.11548, "r_y2": 656.4252799999999, "r_x3": 376.90698, "r_y3": 656.4252799999999, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28684, "r_x1": 545.11517, "r_y1": 677.28684, "r_x2": 545.11517, "r_y2": 668.38028, "r_x3": 308.862, "r_y3": 668.38028, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.0127, "r_x1": 356.90164, "r_y1": 689.0127, "r_x2": 356.90164, "r_y2": 680.42494, "r_x3": 308.862, "r_y3": 680.42494, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13101, "r_y0": 689.24184, "r_x1": 545.1153, "r_y1": 689.24184, "r_x2": 545.1153, "r_y2": 680.33528, "r_x3": 357.13101, "r_y3": 680.33528, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196846, "r_x1": 545.11511, "r_y1": 701.196846, "r_x2": 545.11511, "r_y2": 692.290283, "r_x3": 308.862, "r_y3": 692.290283, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151848, "r_x1": 545.11517, "r_y1": 713.151848, "r_x2": 545.11517, "r_y2": 704.245285, "r_x3": 308.862, "r_y3": 704.245285, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039845, "r_x1": 300.10229, "r_y1": 743.039845, "r_x2": 300.10229, "r_y2": 734.133282, "r_x3": 295.121, "r_y3": 734.133282, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 12, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36505, "b": 96.06994999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9656890034675598, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36505, "r_y1": 84.11492999999996, "r_x2": 286.36505, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 112.64721999999999, "r_y1": 96.06994999999995, "r_x2": 112.64721999999999, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 99.57141000000001, "r": 286.36514, "b": 228.03008999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9838606119155884, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 108.47797000000003, "r_x1": 286.36496, "r_y1": 108.47797000000003, "r_x2": 286.36496, "r_y2": 99.57141000000001, "r_x3": 62.067001, "r_y3": 99.57141000000001, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.43297999999993, "r_x1": 74.749512, "r_y1": 120.43297999999993, "r_x2": 74.749512, "r_y2": 111.52643, "r_x3": 50.112, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.334793, "r_y0": 120.43297999999993, "r_x1": 286.36514, "r_y1": 120.43297999999993, "r_x2": 286.36514, "r_y2": 111.52643, "r_x3": 81.334793, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 132.38800000000003, "r_x1": 286.36511, "r_y1": 132.38800000000003, "r_x2": 286.36511, "r_y2": 123.48145, "r_x3": 50.112, "r_y3": 123.48145, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 144.34302000000002, "r_x1": 286.36511, "r_y1": 144.34302000000002, "r_x2": 286.36511, "r_y2": 135.43646, "r_x3": 50.112, "r_y3": 135.43646, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 156.29900999999995, "r_x1": 286.36505, "r_y1": 156.29900999999995, "r_x2": 286.36505, "r_y2": 147.39246000000003, "r_x3": 50.112, "r_y3": 147.39246000000003, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 168.25402999999994, "r_x1": 286.36511, "r_y1": 168.25402999999994, "r_x2": 286.36511, "r_y2": 159.34747000000004, "r_x3": 50.112, "r_y3": 159.34747000000004, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.20905000000005, "r_x1": 286.36508, "r_y1": 180.20905000000005, "r_x2": 286.36508, "r_y2": 171.30249000000003, "r_x3": 50.112, "r_y3": 171.30249000000003, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.16405999999995, "r_x1": 286.36511, "r_y1": 192.16405999999995, "r_x2": 286.36511, "r_y2": 183.25751000000002, "r_x3": 50.112, "r_y3": 183.25751000000002, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.11908000000005, "r_x1": 286.36508, "r_y1": 204.11908000000005, "r_x2": 286.36508, "r_y2": 195.21252000000004, "r_x3": 50.112, "r_y3": 195.21252000000004, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.07410000000004, "r_x1": 286.36514, "r_y1": 216.07410000000004, "r_x2": 286.36514, "r_y2": 207.16754000000003, "r_x3": 50.112, "r_y3": 207.16754000000003, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.03008999999997, "r_x1": 278.66397, "r_y1": 228.03008999999997, "r_x2": 278.66397, "r_y2": 219.12354000000005, "r_x3": 50.112, "r_y3": 219.12354000000005, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.112, "t": 231.53156, "r": 286.36511, "b": 371.94507, "coord_origin": "TOPLEFT" }, "confidence": 0.9855920076370239, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 240.43811000000005, "r_x1": 286.36493, "r_y1": 240.43811000000005, "r_x2": 286.36493, "r_y2": 231.53156, "r_x3": 62.067001, "r_y3": 231.53156, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 252.39313000000004, "r_x1": 286.36511, "r_y1": 252.39313000000004, "r_x2": 286.36511, "r_y2": 243.48657000000003, "r_x3": 50.112, "r_y3": 243.48657000000003, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.34813999999994, "r_x1": 286.36511, "r_y1": 264.34813999999994, "r_x2": 286.36511, "r_y2": 255.44159000000002, "r_x3": 50.112, "r_y3": 255.44159000000002, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.30316000000005, "r_x1": 286.36502, "r_y1": 276.30316000000005, "r_x2": 286.36502, "r_y2": 267.39661, "r_x3": 50.112, "r_y3": 267.39661, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.25815, "r_x1": 286.36508, "r_y1": 288.25815, "r_x2": 286.36508, "r_y2": 279.35155999999995, "r_x3": 50.112, "r_y3": 279.35155999999995, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.21414, "r_x1": 88.567635, "r_y1": 300.21414, "r_x2": 88.567635, "r_y2": 291.30759, "r_x3": 50.112, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.501602, "r_y0": 300.21414, "r_x1": 286.36505, "r_y1": 300.21414, "r_x2": 286.36505, "r_y2": 291.30759, "r_x3": 95.501602, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.16913, "r_x1": 286.36508, "r_y1": 312.16913, "r_x2": 286.36508, "r_y2": 303.26257, "r_x3": 50.112, "r_y3": 303.26257, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.12411, "r_x1": 286.36511, "r_y1": 324.12411, "r_x2": 286.36511, "r_y2": 315.21756, "r_x3": 50.112, "r_y3": 315.21756, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.0791, "r_x1": 286.36505, "r_y1": 336.0791, "r_x2": 286.36505, "r_y2": 327.17255, "r_x3": 50.112, "r_y3": 327.17255, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.03409, "r_x1": 286.36511, "r_y1": 348.03409, "r_x2": 286.36511, "r_y2": 339.12753, "r_x3": 50.112, "r_y3": 339.12753, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.99008, "r_x1": 286.36508, "r_y1": 359.99008, "r_x2": 286.36508, "r_y2": 351.08353, "r_x3": 50.112, "r_y3": 351.08353, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.94507, "r_x1": 76.951241, "r_y1": 371.94507, "r_x2": 76.951241, "r_y2": 363.03851, "r_x3": 50.112, "r_y3": 363.03851, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 50.112, "t": 375.4465, "r": 286.36658, "b": 432.173, "coord_origin": "TOPLEFT" }, "confidence": 0.9820111393928528, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 384.35306, "r_x1": 286.36499, "r_y1": 384.35306, "r_x2": 286.36499, "r_y2": 375.4465, "r_x3": 62.067001, "r_y3": 375.4465, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.30804, "r_x1": 120.98594, "r_y1": 396.30804, "r_x2": 120.98594, "r_y2": 387.40149, "r_x3": 50.112, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.901, "r_y0": 396.23830999999996, "r_x1": 179.7314, "r_y1": 396.23830999999996, "r_x2": 179.7314, "r_y2": 387.28192, "r_x3": 123.901, "r_y3": 387.28192, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.646, "r_y0": 396.30804, "r_x1": 286.36658, "r_y1": 396.30804, "r_x2": 286.36658, "r_y2": 387.40149, "r_x3": 182.646, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 408.26302999999996, "r_x1": 181.75778, "r_y1": 408.26302999999996, "r_x2": 181.75778, "r_y2": 399.35648, "r_x3": 50.112, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.104, "r_y0": 408.1933, "r_x1": 240.2034, "r_y1": 408.1933, "r_x2": 240.2034, "r_y2": 399.23690999999997, "r_x3": 184.104, "r_y3": 399.23690999999997, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.20401, "r_y0": 408.26302999999996, "r_x1": 286.36069, "r_y1": 408.26302999999996, "r_x2": 286.36069, "r_y2": 399.35648, "r_x3": 240.20401, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 420.21802, "r_x1": 286.36511, "r_y1": 420.21802, "r_x2": 286.36511, "r_y2": 411.31146, "r_x3": 50.112015, "r_y3": 411.31146, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 432.173, "r_x1": 82.520355, "r_y1": 432.173, "r_x2": 82.520355, "r_y2": 423.26645, "r_x3": 50.112015, "r_y3": 423.26645, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 61.569016, "t": 444.43188, "r": 286.3649, "b": 489.32297, "coord_origin": "TOPLEFT" }, "confidence": 0.9822162389755249, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 453.45801, "r_x1": 70.741714, "r_y1": 453.45801, "r_x2": 70.741714, "r_y2": 444.55145, "r_x3": 61.569016, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.034889, "r_y0": 453.45801, "r_x1": 117.10054, "r_y1": 453.45801, "r_x2": 117.10054, "r_y2": 444.55145, "r_x3": 73.034889, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59001, "r_y0": 453.38828, "r_x1": 175.42041, "r_y1": 453.38828, "r_x2": 175.42041, "r_y2": 444.43188, "r_x3": 119.59001, "r_y3": 444.43188, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42102, "r_y0": 453.45801, "r_x1": 286.36453, "r_y1": 453.45801, "r_x2": 286.36453, "r_y2": 444.55145, "r_x3": 175.42102, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 465.41299, "r_x1": 286.3649, "r_y1": 465.41299, "r_x2": 286.3649, "r_y2": 456.50644000000005, "r_x3": 70.037018, "r_y3": 456.50644000000005, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 477.36798, "r_x1": 286.3649, "r_y1": 477.36798, "r_x2": 286.3649, "r_y2": 468.46143, "r_x3": 70.037018, "r_y3": 468.46143, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 489.32297, "r_x1": 99.635902, "r_y1": 489.32297, "r_x2": 99.635902, "r_y2": 480.41641, "r_x3": 70.037018, "r_y3": 480.41641, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 61.569016, "t": 502.03384, "r": 286.3649, "b": 546.9259500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.982271671295166, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 511.05997, "r_x1": 71.619438, "r_y1": 511.05997, "r_x2": 71.619438, "r_y2": 502.15341, "r_x3": 61.569016, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.132042, "r_y0": 511.05997, "r_x1": 196.10396, "r_y1": 511.05997, "r_x2": 196.10396, "r_y2": 502.15341, "r_x3": 74.132042, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31001, "r_y0": 510.99023, "r_x1": 256.14041, "r_y1": 510.99023, "r_x2": 256.14041, "r_y2": 502.03384, "r_x3": 200.31001, "r_y3": 502.03384, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35001, "r_y0": 511.05997, "r_x1": 286.36237, "r_y1": 511.05997, "r_x2": 286.36237, "r_y2": 502.15341, "r_x3": 260.35001, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 523.01495, "r_x1": 286.3649, "r_y1": 523.01495, "r_x2": 286.3649, "r_y2": 514.1084000000001, "r_x3": 70.037003, "r_y3": 514.1084000000001, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 534.97095, "r_x1": 286.36487, "r_y1": 534.97095, "r_x2": 286.36487, "r_y2": 526.06439, "r_x3": 70.037003, "r_y3": 526.06439, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 546.9259500000001, "r_x1": 161.65305, "r_y1": 546.9259500000001, "r_x2": 161.65305, "r_y2": 538.0193899999999, "r_x3": 70.037003, "r_y3": 538.0193899999999, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 61.569, "t": 559.63684, "r": 286.36493, "b": 592.57295, "coord_origin": "TOPLEFT" }, "confidence": 0.9802963733673096, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 568.66295, "r_x1": 71.115913, "r_y1": 568.66295, "r_x2": 71.115913, "r_y2": 559.75639, "r_x3": 61.569, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.502647, "r_y0": 568.66295, "r_x1": 116.71199, "r_y1": 568.66295, "r_x2": 116.71199, "r_y2": 559.75639, "r_x3": 73.502647, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.583, "r_y0": 568.59322, "r_x1": 177.68239, "r_y1": 568.59322, "r_x2": 177.68239, "r_y2": 559.63684, "r_x3": 121.583, "r_y3": 559.63684, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55301, "r_y0": 568.66295, "r_x1": 286.36328, "r_y1": 568.66295, "r_x2": 286.36328, "r_y2": 559.75639, "r_x3": 182.55301, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 580.6179500000001, "r_x1": 286.36493, "r_y1": 580.6179500000001, "r_x2": 286.36493, "r_y2": 571.7114, "r_x3": 70.03701, "r_y3": 571.7114, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 592.57295, "r_x1": 82.400597, "r_y1": 592.57295, "r_x2": 82.400597, "r_y2": 583.6664000000001, "r_x3": 70.03701, "r_y3": 583.6664000000001, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 61.569008000000004, "t": 605.4034, "r": 286.36508, "b": 638.22095, "coord_origin": "TOPLEFT" }, "confidence": 0.9806395173072815, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569008000000004, "r_y0": 614.30995, "r_x1": 72.332527, "r_y1": 614.30995, "r_x2": 72.332527, "r_y2": 605.4034, "r_x3": 61.569008000000004, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.023399, "r_y0": 614.30995, "r_x1": 286.36508, "r_y1": 614.30995, "r_x2": 286.36508, "r_y2": 605.4034, "r_x3": 75.023399, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 626.26495, "r_x1": 286.36487, "r_y1": 626.26495, "r_x2": 286.36487, "r_y2": 617.3584, "r_x3": 70.03701, "r_y3": 617.3584, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 638.22095, "r_x1": 198.05641, "r_y1": 638.22095, "r_x2": 198.05641, "r_y2": 629.31439, "r_x3": 70.03701, "r_y3": 629.31439, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 50.112007, "t": 650.59839, "r": 286.36511, "b": 695.369957, "coord_origin": "TOPLEFT" }, "confidence": 0.9742533564567566, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067009000000006, "r_y0": 659.50494, "r_x1": 286.36496, "r_y1": 659.50494, "r_x2": 286.36496, "r_y2": 650.59839, "r_x3": 62.067009000000006, "r_y3": 650.59839, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 671.45995, "r_x1": 286.36511, "r_y1": 671.45995, "r_x2": 286.36511, "r_y2": 662.55339, "r_x3": 50.112007, "r_y3": 662.55339, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 683.41496, "r_x1": 286.36511, "r_y1": 683.41496, "r_x2": 286.36511, "r_y2": 674.50839, "r_x3": 50.112007, "r_y3": 674.50839, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 695.369957, "r_x1": 286.36511, "r_y1": 695.369957, "r_x2": 286.36511, "r_y2": 686.46339, "r_x3": 50.112007, "r_y3": 686.46339, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "footnote", "bbox": { "l": 60.97100100000001, "t": 705.596275, "r": 183.73055, "b": 712.721542, "coord_origin": "TOPLEFT" }, "confidence": 0.895367443561554, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97100100000001, "r_y0": 712.721542, "r_x1": 183.73055, "r_y1": 712.721542, "r_x2": 183.73055, "r_y2": 705.596275, "r_x3": 60.97100100000001, "r_y3": 705.596275, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "text", "bbox": { "l": 308.862, "t": 75.20836999999995, "r": 545.11511, "b": 108.02495999999985, "coord_origin": "TOPLEFT" }, "confidence": 0.9774322509765625, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 545.11511, "r_y1": 84.11492999999996, "r_x2": 545.11511, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11505, "r_y1": 96.06994999999995, "r_x2": 545.11505, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 508.08417000000003, "r_y1": 108.02495999999985, "r_x2": 508.08417000000003, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 308.862, "t": 121.73193000000003, "r": 498.28021, "b": 132.47968000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9428724646568298, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 132.47968000000003, "r_x1": 315.5831, "r_y1": 132.47968000000003, "r_x2": 315.5831, "r_y2": 121.73193000000003, "r_x3": 308.862, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54456, "r_y0": 132.47968000000003, "r_x1": 498.28021, "r_y1": 132.47968000000003, "r_x2": 498.28021, "r_y2": 121.73193000000003, "r_x3": 324.54456, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 142.22136999999998, "r": 545.11517, "b": 330.45502, "coord_origin": "TOPLEFT" }, "confidence": 0.987194836139679, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 151.12793, "r_x1": 545.11493, "r_y1": 151.12793, "r_x2": 545.11493, "r_y2": 142.22136999999998, "r_x3": 320.81699, "r_y3": 142.22136999999998, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 163.08294999999998, "r_x1": 545.11505, "r_y1": 163.08294999999998, "r_x2": 545.11505, "r_y2": 154.17638999999997, "r_x3": 308.862, "r_y3": 154.17638999999997, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 175.03796, "r_x1": 522.55975, "r_y1": 175.03796, "r_x2": 522.55975, "r_y2": 166.13140999999996, "r_x3": 308.862, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 175.03796, "r_x1": 545.11505, "r_y1": 175.03796, "r_x2": 545.11505, "r_y2": 166.13140999999996, "r_x3": 529.62323, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 186.99298, "r_x1": 545.11517, "r_y1": 186.99298, "r_x2": 545.11517, "r_y2": 178.08642999999995, "r_x3": 308.862, "r_y3": 178.08642999999995, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 198.94799999999998, "r_x1": 545.11511, "r_y1": 198.94799999999998, "r_x2": 545.11511, "r_y2": 190.04143999999997, "r_x3": 308.862, "r_y3": 190.04143999999997, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 210.90301999999997, "r_x1": 346.97891, "r_y1": 210.90301999999997, "r_x2": 346.97891, "r_y2": 201.99645999999996, "r_x3": 308.862, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.86929, "r_y0": 210.90301999999997, "r_x1": 545.11511, "r_y1": 210.90301999999997, "r_x2": 545.11511, "r_y2": 201.99645999999996, "r_x3": 354.86929, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 222.85901, "r_x1": 545.11505, "r_y1": 222.85901, "r_x2": 545.11505, "r_y2": 213.95245, "r_x3": 308.862, "r_y3": 213.95245, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 234.81403, "r_x1": 530.9184, "r_y1": 234.81403, "r_x2": 530.9184, "r_y2": 225.90747, "r_x3": 308.862, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92212, "r_y0": 234.81403, "r_x1": 545.11511, "r_y1": 234.81403, "r_x2": 545.11511, "r_y2": 225.90747, "r_x3": 537.92212, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 246.76904000000002, "r_x1": 545.11517, "r_y1": 246.76904000000002, "r_x2": 545.11517, "r_y2": 237.86248999999998, "r_x3": 308.862, "r_y3": 237.86248999999998, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.72406, "r_x1": 545.11511, "r_y1": 258.72406, "r_x2": 545.11511, "r_y2": 249.8175, "r_x3": 308.862, "r_y3": 249.8175, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.67908, "r_x1": 439.8402699999999, "r_y1": 270.67908, "r_x2": 439.8402699999999, "r_y2": 261.77252, "r_x3": 308.862, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.43999999999994, "r_y0": 270.45989999999995, "r_x1": 452.1889, "r_y1": 270.45989999999995, "r_x2": 452.1889, "r_y2": 261.61310000000003, "r_x3": 444.43999999999994, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89001, "r_y0": 270.45989999999995, "r_x1": 470.83392000000003, "r_y1": 270.45989999999995, "r_x2": 470.83392000000003, "r_y2": 261.61310000000003, "r_x3": 455.89001, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83401, "r_y0": 270.67908, "r_x1": 545.11517, "r_y1": 270.67908, "r_x2": 545.11517, "r_y2": 261.77252, "r_x3": 470.83401, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.63406, "r_x1": 545.11511, "r_y1": 282.63406, "r_x2": 545.11511, "r_y2": 273.72748, "r_x3": 308.862, "r_y3": 273.72748, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.59006, "r_x1": 545.11511, "r_y1": 294.59006, "r_x2": 545.11511, "r_y2": 285.6835, "r_x3": 308.862, "r_y3": 285.6835, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 306.54504, "r_x1": 545.11511, "r_y1": 306.54504, "r_x2": 545.11511, "r_y2": 297.63849, "r_x3": 308.862, "r_y3": 297.63849, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 318.50003000000004, "r_x1": 545.11517, "r_y1": 318.50003000000004, "r_x2": 545.11517, "r_y2": 309.59348, "r_x3": 308.862, "r_y3": 309.59348, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 330.45502, "r_x1": 425.92255, "r_y1": 330.45502, "r_x2": 425.92255, "r_y2": 321.54846, "r_x3": 308.862, "r_y3": 321.54846, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.862, "t": 333.56946, "r": 545.11523, "b": 450.0729099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9869040250778198, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 342.47601, "r_x1": 545.11499, "r_y1": 342.47601, "r_x2": 545.11499, "r_y2": 333.56946, "r_x3": 320.81699, "r_y3": 333.56946, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 354.43100000000004, "r_x1": 545.11499, "r_y1": 354.43100000000004, "r_x2": 545.11499, "r_y2": 345.52444, "r_x3": 308.862, "r_y3": 345.52444, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 366.38599, "r_x1": 545.11517, "r_y1": 366.38599, "r_x2": 545.11517, "r_y2": 357.47943, "r_x3": 308.862, "r_y3": 357.47943, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 378.34198, "r_x1": 545.11511, "r_y1": 378.34198, "r_x2": 545.11511, "r_y2": 369.43542, "r_x3": 308.862, "r_y3": 369.43542, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 390.29697, "r_x1": 545.11505, "r_y1": 390.29697, "r_x2": 545.11505, "r_y2": 381.39041, "r_x3": 308.862, "r_y3": 381.39041, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 402.25195, "r_x1": 545.11505, "r_y1": 402.25195, "r_x2": 545.11505, "r_y2": 393.3453999999999, "r_x3": 308.862, "r_y3": 393.3453999999999, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 414.20694, "r_x1": 545.11517, "r_y1": 414.20694, "r_x2": 545.11517, "r_y2": 405.30038, "r_x3": 308.862, "r_y3": 405.30038, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 426.16193, "r_x1": 545.11523, "r_y1": 426.16193, "r_x2": 545.11523, "r_y2": 417.25537, "r_x3": 308.862, "r_y3": 417.25537, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 438.11792, "r_x1": 545.11511, "r_y1": 438.11792, "r_x2": 545.11511, "r_y2": 429.21136000000007, "r_x3": 308.862, "r_y3": 429.21136000000007, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 450.0729099999999, "r_x1": 401.28503, "r_y1": 450.0729099999999, "r_x2": 401.28503, "r_y2": 441.16635, "r_x3": 308.862, "r_y3": 441.16635, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.86197, "t": 453.06778, "r": 545.11688, "b": 713.151848, "coord_origin": "TOPLEFT" }, "confidence": 0.9843218326568604, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 462.02417, "r_x1": 423.26236, "r_y1": 462.02417, "r_x2": 423.26236, "r_y2": 453.06778, "r_x3": 320.81699, "r_y3": 453.06778, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.26697, "r_y0": 462.0939, "r_x1": 545.10956, "r_y1": 462.0939, "r_x2": 545.10956, "r_y2": 453.18735, "r_x3": 423.26697, "r_y3": 453.18735, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 474.04889, "r_x1": 545.11511, "r_y1": 474.04889, "r_x2": 545.11511, "r_y2": 465.14233, "r_x3": 308.86197, "r_y3": 465.14233, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 486.00388, "r_x1": 335.7012, "r_y1": 486.00388, "r_x2": 335.7012, "r_y2": 477.09732, "r_x3": 308.86197, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85309, "r_y0": 486.00388, "r_x1": 545.11505, "r_y1": 486.00388, "r_x2": 545.11505, "r_y2": 477.09732, "r_x3": 345.85309, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.95886, "r_x1": 545.11493, "r_y1": 497.95886, "r_x2": 545.11493, "r_y2": 489.05231, "r_x3": 308.86197, "r_y3": 489.05231, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.91385, "r_x1": 545.11499, "r_y1": 509.91385, "r_x2": 545.11499, "r_y2": 501.00729, "r_x3": 308.86197, "r_y3": 501.00729, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.8698400000001, "r_x1": 545.11505, "r_y1": 521.8698400000001, "r_x2": 545.11505, "r_y2": 512.9632899999999, "r_x3": 308.86197, "r_y3": 512.9632899999999, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.82483, "r_x1": 545.11505, "r_y1": 533.82483, "r_x2": 545.11505, "r_y2": 524.91827, "r_x3": 308.86197, "r_y3": 524.91827, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.77983, "r_x1": 420.94119, "r_y1": 545.77983, "r_x2": 420.94119, "r_y2": 536.87328, "r_x3": 308.86197, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59497, "r_y0": 545.56065, "r_x1": 433.5575600000001, "r_y1": 545.56065, "r_x2": 433.5575600000001, "r_y2": 536.1559599999999, "r_x3": 423.59497, "r_y3": 536.1559599999999, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21198, "r_y0": 545.77983, "r_x1": 545.11316, "r_y1": 545.77983, "r_x2": 545.11316, "r_y2": 536.87328, "r_x3": 436.21198, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 557.73483, "r_x1": 545.11511, "r_y1": 557.73483, "r_x2": 545.11511, "r_y2": 548.82828, "r_x3": 308.86197, "r_y3": 548.82828, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 569.68983, "r_x1": 545.11493, "r_y1": 569.68983, "r_x2": 545.11493, "r_y2": 560.78328, "r_x3": 308.86197, "r_y3": 560.78328, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 581.6448399999999, "r_x1": 545.11499, "r_y1": 581.6448399999999, "r_x2": 545.11499, "r_y2": 572.73828, "r_x3": 308.86197, "r_y3": 572.73828, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 593.60083, "r_x1": 545.11505, "r_y1": 593.60083, "r_x2": 545.11505, "r_y2": 584.69427, "r_x3": 308.86197, "r_y3": 584.69427, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 605.55583, "r_x1": 497.07541, "r_y1": 605.55583, "r_x2": 497.07541, "r_y2": 596.6492800000001, "r_x3": 308.86197, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.80496, "r_y0": 605.33665, "r_x1": 509.76755, "r_y1": 605.33665, "r_x2": 509.76755, "r_y2": 595.93196, "r_x3": 499.80496, "r_y3": 595.93196, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.50098, "r_y0": 605.55583, "r_x1": 545.10852, "r_y1": 605.55583, "r_x2": 545.10852, "r_y2": 596.6492800000001, "r_x3": 512.50098, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 617.5108299999999, "r_x1": 545.11511, "r_y1": 617.5108299999999, "r_x2": 545.11511, "r_y2": 608.60428, "r_x3": 308.86197, "r_y3": 608.60428, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.46584, "r_x1": 545.11505, "r_y1": 629.46584, "r_x2": 545.11505, "r_y2": 620.55928, "r_x3": 308.86197, "r_y3": 620.55928, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.42084, "r_x1": 364.78201, "r_y1": 641.42084, "r_x2": 364.78201, "r_y2": 632.51428, "r_x3": 308.86197, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57397, "r_y0": 641.1917, "r_x1": 415.61362, "r_y1": 641.1917, "r_x2": 415.61362, "r_y2": 632.60394, "r_x3": 367.57397, "r_y3": 632.60394, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61298, "r_y0": 641.42084, "r_x1": 545.11688, "r_y1": 641.42084, "r_x2": 545.11688, "r_y2": 632.51428, "r_x3": 415.61298, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.37584, "r_x1": 545.11511, "r_y1": 653.37584, "r_x2": 545.11511, "r_y2": 644.46928, "r_x3": 308.86197, "r_y3": 644.46928, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 665.1027, "r_x1": 373.59894, "r_y1": 665.1027, "r_x2": 373.59894, "r_y2": 656.51494, "r_x3": 308.86197, "r_y3": 656.51494, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.90698, "r_y0": 665.33184, "r_x1": 545.11548, "r_y1": 665.33184, "r_x2": 545.11548, "r_y2": 656.4252799999999, "r_x3": 376.90698, "r_y3": 656.4252799999999, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28684, "r_x1": 545.11517, "r_y1": 677.28684, "r_x2": 545.11517, "r_y2": 668.38028, "r_x3": 308.862, "r_y3": 668.38028, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.0127, "r_x1": 356.90164, "r_y1": 689.0127, "r_x2": 356.90164, "r_y2": 680.42494, "r_x3": 308.862, "r_y3": 680.42494, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13101, "r_y0": 689.24184, "r_x1": 545.1153, "r_y1": 689.24184, "r_x2": 545.1153, "r_y2": 680.33528, "r_x3": 357.13101, "r_y3": 680.33528, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196846, "r_x1": 545.11511, "r_y1": 701.196846, "r_x2": 545.11511, "r_y2": 692.290283, "r_x3": 308.862, "r_y3": 692.290283, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151848, "r_x1": 545.11517, "r_y1": 713.151848, "r_x2": 545.11517, "r_y2": 704.245285, "r_x3": 308.862, "r_y3": 704.245285, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133282, "r": 300.10229, "b": 743.039845, "coord_origin": "TOPLEFT" }, "confidence": 0.8778094053268433, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039845, "r_x1": 300.10229, "r_y1": 743.039845, "r_x2": 300.10229, "r_y2": 734.133282, "r_x3": 295.121, "r_y3": 734.133282, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 12, "page_no": 1, "cluster": { "id": 12, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36505, "b": 96.06994999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9656890034675598, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36505, "r_y1": 84.11492999999996, "r_x2": 286.36505, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 112.64721999999999, "r_y1": 96.06994999999995, "r_x2": 112.64721999999999, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "considered as a solved problem, given enough ground-truth data to train on." }, { "label": "text", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 99.57141000000001, "r": 286.36514, "b": 228.03008999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9838606119155884, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 108.47797000000003, "r_x1": 286.36496, "r_y1": 108.47797000000003, "r_x2": 286.36496, "r_y2": 99.57141000000001, "r_x3": 62.067001, "r_y3": 99.57141000000001, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.43297999999993, "r_x1": 74.749512, "r_y1": 120.43297999999993, "r_x2": 74.749512, "r_y2": 111.52643, "r_x3": 50.112, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.334793, "r_y0": 120.43297999999993, "r_x1": 286.36514, "r_y1": 120.43297999999993, "r_x2": 286.36514, "r_y2": 111.52643, "r_x3": 81.334793, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 132.38800000000003, "r_x1": 286.36511, "r_y1": 132.38800000000003, "r_x2": 286.36511, "r_y2": 123.48145, "r_x3": 50.112, "r_y3": 123.48145, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 144.34302000000002, "r_x1": 286.36511, "r_y1": 144.34302000000002, "r_x2": 286.36511, "r_y2": 135.43646, "r_x3": 50.112, "r_y3": 135.43646, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 156.29900999999995, "r_x1": 286.36505, "r_y1": 156.29900999999995, "r_x2": 286.36505, "r_y2": 147.39246000000003, "r_x3": 50.112, "r_y3": 147.39246000000003, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 168.25402999999994, "r_x1": 286.36511, "r_y1": 168.25402999999994, "r_x2": 286.36511, "r_y2": 159.34747000000004, "r_x3": 50.112, "r_y3": 159.34747000000004, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.20905000000005, "r_x1": 286.36508, "r_y1": 180.20905000000005, "r_x2": 286.36508, "r_y2": 171.30249000000003, "r_x3": 50.112, "r_y3": 171.30249000000003, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.16405999999995, "r_x1": 286.36511, "r_y1": 192.16405999999995, "r_x2": 286.36511, "r_y2": 183.25751000000002, "r_x3": 50.112, "r_y3": 183.25751000000002, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.11908000000005, "r_x1": 286.36508, "r_y1": 204.11908000000005, "r_x2": 286.36508, "r_y2": 195.21252000000004, "r_x3": 50.112, "r_y3": 195.21252000000004, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.07410000000004, "r_x1": 286.36514, "r_y1": 216.07410000000004, "r_x2": 286.36514, "r_y2": 207.16754000000003, "r_x3": 50.112, "r_y3": 207.16754000000003, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.03008999999997, "r_x1": 278.66397, "r_y1": 228.03008999999997, "r_x2": 278.66397, "r_y2": 219.12354000000005, "r_x3": 50.112, "r_y3": 219.12354000000005, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image." }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.112, "t": 231.53156, "r": 286.36511, "b": 371.94507, "coord_origin": "TOPLEFT" }, "confidence": 0.9855920076370239, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 240.43811000000005, "r_x1": 286.36493, "r_y1": 240.43811000000005, "r_x2": 286.36493, "r_y2": 231.53156, "r_x3": 62.067001, "r_y3": 231.53156, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 252.39313000000004, "r_x1": 286.36511, "r_y1": 252.39313000000004, "r_x2": 286.36511, "r_y2": 243.48657000000003, "r_x3": 50.112, "r_y3": 243.48657000000003, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.34813999999994, "r_x1": 286.36511, "r_y1": 264.34813999999994, "r_x2": 286.36511, "r_y2": 255.44159000000002, "r_x3": 50.112, "r_y3": 255.44159000000002, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.30316000000005, "r_x1": 286.36502, "r_y1": 276.30316000000005, "r_x2": 286.36502, "r_y2": 267.39661, "r_x3": 50.112, "r_y3": 267.39661, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.25815, "r_x1": 286.36508, "r_y1": 288.25815, "r_x2": 286.36508, "r_y2": 279.35155999999995, "r_x3": 50.112, "r_y3": 279.35155999999995, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.21414, "r_x1": 88.567635, "r_y1": 300.21414, "r_x2": 88.567635, "r_y2": 291.30759, "r_x3": 50.112, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.501602, "r_y0": 300.21414, "r_x1": 286.36505, "r_y1": 300.21414, "r_x2": 286.36505, "r_y2": 291.30759, "r_x3": 95.501602, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.16913, "r_x1": 286.36508, "r_y1": 312.16913, "r_x2": 286.36508, "r_y2": 303.26257, "r_x3": 50.112, "r_y3": 303.26257, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.12411, "r_x1": 286.36511, "r_y1": 324.12411, "r_x2": 286.36511, "r_y2": 315.21756, "r_x3": 50.112, "r_y3": 315.21756, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.0791, "r_x1": 286.36505, "r_y1": 336.0791, "r_x2": 286.36505, "r_y2": 327.17255, "r_x3": 50.112, "r_y3": 327.17255, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.03409, "r_x1": 286.36511, "r_y1": 348.03409, "r_x2": 286.36511, "r_y2": 339.12753, "r_x3": 50.112, "r_y3": 339.12753, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.99008, "r_x1": 286.36508, "r_y1": 359.99008, "r_x2": 286.36508, "r_y2": 351.08353, "r_x3": 50.112, "r_y3": 351.08353, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.94507, "r_x1": 76.951241, "r_y1": 371.94507, "r_x2": 76.951241, "r_y2": 363.03851, "r_x3": 50.112, "r_y3": 363.03851, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image." }, { "label": "text", "id": 7, "page_no": 1, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.112, "t": 375.4465, "r": 286.36658, "b": 432.173, "coord_origin": "TOPLEFT" }, "confidence": 0.9820111393928528, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 384.35306, "r_x1": 286.36499, "r_y1": 384.35306, "r_x2": 286.36499, "r_y2": 375.4465, "r_x3": 62.067001, "r_y3": 375.4465, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.30804, "r_x1": 120.98594, "r_y1": 396.30804, "r_x2": 120.98594, "r_y2": 387.40149, "r_x3": 50.112, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.901, "r_y0": 396.23830999999996, "r_x1": 179.7314, "r_y1": 396.23830999999996, "r_x2": 179.7314, "r_y2": 387.28192, "r_x3": 123.901, "r_y3": 387.28192, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.646, "r_y0": 396.30804, "r_x1": 286.36658, "r_y1": 396.30804, "r_x2": 286.36658, "r_y2": 387.40149, "r_x3": 182.646, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 408.26302999999996, "r_x1": 181.75778, "r_y1": 408.26302999999996, "r_x2": 181.75778, "r_y2": 399.35648, "r_x3": 50.112, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.104, "r_y0": 408.1933, "r_x1": 240.2034, "r_y1": 408.1933, "r_x2": 240.2034, "r_y2": 399.23690999999997, "r_x3": 184.104, "r_y3": 399.23690999999997, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.20401, "r_y0": 408.26302999999996, "r_x1": 286.36069, "r_y1": 408.26302999999996, "r_x2": 286.36069, "r_y2": 399.35648, "r_x3": 240.20401, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 420.21802, "r_x1": 286.36511, "r_y1": 420.21802, "r_x2": 286.36511, "r_y2": 411.31146, "r_x3": 50.112015, "r_y3": 411.31146, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 432.173, "r_x1": 82.520355, "r_y1": 432.173, "r_x2": 82.520355, "r_y2": 423.26645, "r_x3": 50.112015, "r_y3": 423.26645, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:" }, { "label": "list_item", "id": 6, "page_no": 1, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 61.569016, "t": 444.43188, "r": 286.3649, "b": 489.32297, "coord_origin": "TOPLEFT" }, "confidence": 0.9822162389755249, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 453.45801, "r_x1": 70.741714, "r_y1": 453.45801, "r_x2": 70.741714, "r_y2": 444.55145, "r_x3": 61.569016, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.034889, "r_y0": 453.45801, "r_x1": 117.10054, "r_y1": 453.45801, "r_x2": 117.10054, "r_y2": 444.55145, "r_x3": 73.034889, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59001, "r_y0": 453.38828, "r_x1": 175.42041, "r_y1": 453.38828, "r_x2": 175.42041, "r_y2": 444.43188, "r_x3": 119.59001, "r_y3": 444.43188, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42102, "r_y0": 453.45801, "r_x1": 286.36453, "r_y1": 453.45801, "r_x2": 286.36453, "r_y2": 444.55145, "r_x3": 175.42102, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 465.41299, "r_x1": 286.3649, "r_y1": 465.41299, "r_x2": 286.3649, "r_y2": 456.50644000000005, "r_x3": 70.037018, "r_y3": 456.50644000000005, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 477.36798, "r_x1": 286.3649, "r_y1": 477.36798, "r_x2": 286.3649, "r_y2": 468.46143, "r_x3": 70.037018, "r_y3": 468.46143, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 489.32297, "r_x1": 99.635902, "r_y1": 489.32297, "r_x2": 99.635902, "r_y2": 480.41641, "r_x3": 70.037018, "r_y3": 480.41641, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach." }, { "label": "list_item", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 61.569016, "t": 502.03384, "r": 286.3649, "b": 546.9259500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.982271671295166, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 511.05997, "r_x1": 71.619438, "r_y1": 511.05997, "r_x2": 71.619438, "r_y2": 502.15341, "r_x3": 61.569016, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.132042, "r_y0": 511.05997, "r_x1": 196.10396, "r_y1": 511.05997, "r_x2": 196.10396, "r_y2": 502.15341, "r_x3": 74.132042, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31001, "r_y0": 510.99023, "r_x1": 256.14041, "r_y1": 510.99023, "r_x2": 256.14041, "r_y2": 502.03384, "r_x3": 200.31001, "r_y3": 502.03384, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35001, "r_y0": 511.05997, "r_x1": 286.36237, "r_y1": 511.05997, "r_x2": 286.36237, "r_y2": 502.15341, "r_x3": 260.35001, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 523.01495, "r_x1": 286.3649, "r_y1": 523.01495, "r_x2": 286.3649, "r_y2": 514.1084000000001, "r_x3": 70.037003, "r_y3": 514.1084000000001, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 534.97095, "r_x1": 286.36487, "r_y1": 534.97095, "r_x2": 286.36487, "r_y2": 526.06439, "r_x3": 70.037003, "r_y3": 526.06439, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 546.9259500000001, "r_x1": 161.65305, "r_y1": 546.9259500000001, "r_x2": 161.65305, "r_y2": 538.0193899999999, "r_x3": 70.037003, "r_y3": 538.0193899999999, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works." }, { "label": "list_item", "id": 9, "page_no": 1, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 61.569, "t": 559.63684, "r": 286.36493, "b": 592.57295, "coord_origin": "TOPLEFT" }, "confidence": 0.9802963733673096, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 568.66295, "r_x1": 71.115913, "r_y1": 568.66295, "r_x2": 71.115913, "r_y2": 559.75639, "r_x3": 61.569, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.502647, "r_y0": 568.66295, "r_x1": 116.71199, "r_y1": 568.66295, "r_x2": 116.71199, "r_y2": 559.75639, "r_x3": 73.502647, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.583, "r_y0": 568.59322, "r_x1": 177.68239, "r_y1": 568.59322, "r_x2": 177.68239, "r_y2": 559.63684, "r_x3": 121.583, "r_y3": 559.63684, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55301, "r_y0": 568.66295, "r_x1": 286.36328, "r_y1": 568.66295, "r_x2": 286.36328, "r_y2": 559.75639, "r_x3": 182.55301, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 580.6179500000001, "r_x1": 286.36493, "r_y1": 580.6179500000001, "r_x2": 286.36493, "r_y2": 571.7114, "r_x3": 70.03701, "r_y3": 571.7114, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 592.57295, "r_x1": 82.400597, "r_y1": 592.57295, "r_x2": 82.400597, "r_y2": 583.6664000000001, "r_x3": 70.03701, "r_y3": 583.6664000000001, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity." }, { "label": "list_item", "id": 8, "page_no": 1, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 61.569008000000004, "t": 605.4034, "r": 286.36508, "b": 638.22095, "coord_origin": "TOPLEFT" }, "confidence": 0.9806395173072815, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569008000000004, "r_y0": 614.30995, "r_x1": 72.332527, "r_y1": 614.30995, "r_x2": 72.332527, "r_y2": 605.4034, "r_x3": 61.569008000000004, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.023399, "r_y0": 614.30995, "r_x1": 286.36508, "r_y1": 614.30995, "r_x2": 286.36508, "r_y2": 605.4034, "r_x3": 75.023399, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 626.26495, "r_x1": 286.36487, "r_y1": 626.26495, "r_x2": 286.36487, "r_y2": 617.3584, "r_x3": 70.03701, "r_y3": 617.3584, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 638.22095, "r_x1": 198.05641, "r_y1": 638.22095, "r_x2": 198.05641, "r_y2": 629.31439, "r_x3": 70.03701, "r_y3": 629.31439, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility." }, { "label": "text", "id": 11, "page_no": 1, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.112007, "t": 650.59839, "r": 286.36511, "b": 695.369957, "coord_origin": "TOPLEFT" }, "confidence": 0.9742533564567566, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067009000000006, "r_y0": 659.50494, "r_x1": 286.36496, "r_y1": 659.50494, "r_x2": 286.36496, "r_y2": 650.59839, "r_x3": 62.067009000000006, "r_y3": 650.59839, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 671.45995, "r_x1": 286.36511, "r_y1": 671.45995, "r_x2": 286.36511, "r_y2": 662.55339, "r_x3": 50.112007, "r_y3": 662.55339, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 683.41496, "r_x1": 286.36511, "r_y1": 683.41496, "r_x2": 286.36511, "r_y2": 674.50839, "r_x3": 50.112007, "r_y3": 674.50839, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 695.369957, "r_x1": 286.36511, "r_y1": 695.369957, "r_x2": 286.36511, "r_y2": 686.46339, "r_x3": 50.112007, "r_y3": 686.46339, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe" }, { "label": "footnote", "id": 14, "page_no": 1, "cluster": { "id": 14, "label": "footnote", "bbox": { "l": 60.97100100000001, "t": 705.596275, "r": 183.73055, "b": 712.721542, "coord_origin": "TOPLEFT" }, "confidence": 0.895367443561554, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97100100000001, "r_y0": 712.721542, "r_x1": 183.73055, "r_y1": 712.721542, "r_x2": 183.73055, "r_y2": 705.596275, "r_x3": 60.97100100000001, "r_y3": 705.596275, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "$^{1}$https://github.com/IBM/SynthTabNet" }, { "label": "text", "id": 10, "page_no": 1, "cluster": { "id": 10, "label": "text", "bbox": { "l": 308.862, "t": 75.20836999999995, "r": 545.11511, "b": 108.02495999999985, "coord_origin": "TOPLEFT" }, "confidence": 0.9774322509765625, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 545.11511, "r_y1": 84.11492999999996, "r_x2": 545.11511, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11505, "r_y1": 96.06994999999995, "r_x2": 545.11505, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 508.08417000000003, "r_y1": 108.02495999999985, "r_x2": 508.08417000000003, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community." }, { "label": "section_header", "id": 13, "page_no": 1, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 308.862, "t": 121.73193000000003, "r": 498.28021, "b": 132.47968000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9428724646568298, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 132.47968000000003, "r_x1": 315.5831, "r_y1": 132.47968000000003, "r_x2": 315.5831, "r_y2": 121.73193000000003, "r_x3": 308.862, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54456, "r_y0": 132.47968000000003, "r_x1": 498.28021, "r_y1": 132.47968000000003, "r_x2": 498.28021, "r_y2": 121.73193000000003, "r_x3": 324.54456, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Previous work and State of the Art" }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 142.22136999999998, "r": 545.11517, "b": 330.45502, "coord_origin": "TOPLEFT" }, "confidence": 0.987194836139679, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 151.12793, "r_x1": 545.11493, "r_y1": 151.12793, "r_x2": 545.11493, "r_y2": 142.22136999999998, "r_x3": 320.81699, "r_y3": 142.22136999999998, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 163.08294999999998, "r_x1": 545.11505, "r_y1": 163.08294999999998, "r_x2": 545.11505, "r_y2": 154.17638999999997, "r_x3": 308.862, "r_y3": 154.17638999999997, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 175.03796, "r_x1": 522.55975, "r_y1": 175.03796, "r_x2": 522.55975, "r_y2": 166.13140999999996, "r_x3": 308.862, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 175.03796, "r_x1": 545.11505, "r_y1": 175.03796, "r_x2": 545.11505, "r_y2": 166.13140999999996, "r_x3": 529.62323, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 186.99298, "r_x1": 545.11517, "r_y1": 186.99298, "r_x2": 545.11517, "r_y2": 178.08642999999995, "r_x3": 308.862, "r_y3": 178.08642999999995, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 198.94799999999998, "r_x1": 545.11511, "r_y1": 198.94799999999998, "r_x2": 545.11511, "r_y2": 190.04143999999997, "r_x3": 308.862, "r_y3": 190.04143999999997, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 210.90301999999997, "r_x1": 346.97891, "r_y1": 210.90301999999997, "r_x2": 346.97891, "r_y2": 201.99645999999996, "r_x3": 308.862, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.86929, "r_y0": 210.90301999999997, "r_x1": 545.11511, "r_y1": 210.90301999999997, "r_x2": 545.11511, "r_y2": 201.99645999999996, "r_x3": 354.86929, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 222.85901, "r_x1": 545.11505, "r_y1": 222.85901, "r_x2": 545.11505, "r_y2": 213.95245, "r_x3": 308.862, "r_y3": 213.95245, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 234.81403, "r_x1": 530.9184, "r_y1": 234.81403, "r_x2": 530.9184, "r_y2": 225.90747, "r_x3": 308.862, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92212, "r_y0": 234.81403, "r_x1": 545.11511, "r_y1": 234.81403, "r_x2": 545.11511, "r_y2": 225.90747, "r_x3": 537.92212, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 246.76904000000002, "r_x1": 545.11517, "r_y1": 246.76904000000002, "r_x2": 545.11517, "r_y2": 237.86248999999998, "r_x3": 308.862, "r_y3": 237.86248999999998, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.72406, "r_x1": 545.11511, "r_y1": 258.72406, "r_x2": 545.11511, "r_y2": 249.8175, "r_x3": 308.862, "r_y3": 249.8175, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.67908, "r_x1": 439.8402699999999, "r_y1": 270.67908, "r_x2": 439.8402699999999, "r_y2": 261.77252, "r_x3": 308.862, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.43999999999994, "r_y0": 270.45989999999995, "r_x1": 452.1889, "r_y1": 270.45989999999995, "r_x2": 452.1889, "r_y2": 261.61310000000003, "r_x3": 444.43999999999994, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89001, "r_y0": 270.45989999999995, "r_x1": 470.83392000000003, "r_y1": 270.45989999999995, "r_x2": 470.83392000000003, "r_y2": 261.61310000000003, "r_x3": 455.89001, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83401, "r_y0": 270.67908, "r_x1": 545.11517, "r_y1": 270.67908, "r_x2": 545.11517, "r_y2": 261.77252, "r_x3": 470.83401, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.63406, "r_x1": 545.11511, "r_y1": 282.63406, "r_x2": 545.11511, "r_y2": 273.72748, "r_x3": 308.862, "r_y3": 273.72748, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.59006, "r_x1": 545.11511, "r_y1": 294.59006, "r_x2": 545.11511, "r_y2": 285.6835, "r_x3": 308.862, "r_y3": 285.6835, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 306.54504, "r_x1": 545.11511, "r_y1": 306.54504, "r_x2": 545.11511, "r_y2": 297.63849, "r_x3": 308.862, "r_y3": 297.63849, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 318.50003000000004, "r_x1": 545.11517, "r_y1": 318.50003000000004, "r_x2": 545.11517, "r_y2": 309.59348, "r_x3": 308.862, "r_y3": 309.59348, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 330.45502, "r_x1": 425.92255, "r_y1": 330.45502, "r_x2": 425.92255, "r_y2": 321.54846, "r_x3": 308.862, "r_y3": 321.54846, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc." }, { "label": "text", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.862, "t": 333.56946, "r": 545.11523, "b": 450.0729099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9869040250778198, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 342.47601, "r_x1": 545.11499, "r_y1": 342.47601, "r_x2": 545.11499, "r_y2": 333.56946, "r_x3": 320.81699, "r_y3": 333.56946, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 354.43100000000004, "r_x1": 545.11499, "r_y1": 354.43100000000004, "r_x2": 545.11499, "r_y2": 345.52444, "r_x3": 308.862, "r_y3": 345.52444, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 366.38599, "r_x1": 545.11517, "r_y1": 366.38599, "r_x2": 545.11517, "r_y2": 357.47943, "r_x3": 308.862, "r_y3": 357.47943, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 378.34198, "r_x1": 545.11511, "r_y1": 378.34198, "r_x2": 545.11511, "r_y2": 369.43542, "r_x3": 308.862, "r_y3": 369.43542, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 390.29697, "r_x1": 545.11505, "r_y1": 390.29697, "r_x2": 545.11505, "r_y2": 381.39041, "r_x3": 308.862, "r_y3": 381.39041, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 402.25195, "r_x1": 545.11505, "r_y1": 402.25195, "r_x2": 545.11505, "r_y2": 393.3453999999999, "r_x3": 308.862, "r_y3": 393.3453999999999, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 414.20694, "r_x1": 545.11517, "r_y1": 414.20694, "r_x2": 545.11517, "r_y2": 405.30038, "r_x3": 308.862, "r_y3": 405.30038, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 426.16193, "r_x1": 545.11523, "r_y1": 426.16193, "r_x2": 545.11523, "r_y2": 417.25537, "r_x3": 308.862, "r_y3": 417.25537, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 438.11792, "r_x1": 545.11511, "r_y1": 438.11792, "r_x2": 545.11511, "r_y2": 429.21136000000007, "r_x3": 308.862, "r_y3": 429.21136000000007, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 450.0729099999999, "r_x1": 401.28503, "r_y1": 450.0729099999999, "r_x2": 401.28503, "r_y2": 441.16635, "r_x3": 308.862, "r_y3": 441.16635, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification." }, { "label": "text", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86197, "t": 453.06778, "r": 545.11688, "b": 713.151848, "coord_origin": "TOPLEFT" }, "confidence": 0.9843218326568604, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 462.02417, "r_x1": 423.26236, "r_y1": 462.02417, "r_x2": 423.26236, "r_y2": 453.06778, "r_x3": 320.81699, "r_y3": 453.06778, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.26697, "r_y0": 462.0939, "r_x1": 545.10956, "r_y1": 462.0939, "r_x2": 545.10956, "r_y2": 453.18735, "r_x3": 423.26697, "r_y3": 453.18735, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 474.04889, "r_x1": 545.11511, "r_y1": 474.04889, "r_x2": 545.11511, "r_y2": 465.14233, "r_x3": 308.86197, "r_y3": 465.14233, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 486.00388, "r_x1": 335.7012, "r_y1": 486.00388, "r_x2": 335.7012, "r_y2": 477.09732, "r_x3": 308.86197, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85309, "r_y0": 486.00388, "r_x1": 545.11505, "r_y1": 486.00388, "r_x2": 545.11505, "r_y2": 477.09732, "r_x3": 345.85309, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.95886, "r_x1": 545.11493, "r_y1": 497.95886, "r_x2": 545.11493, "r_y2": 489.05231, "r_x3": 308.86197, "r_y3": 489.05231, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.91385, "r_x1": 545.11499, "r_y1": 509.91385, "r_x2": 545.11499, "r_y2": 501.00729, "r_x3": 308.86197, "r_y3": 501.00729, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.8698400000001, "r_x1": 545.11505, "r_y1": 521.8698400000001, "r_x2": 545.11505, "r_y2": 512.9632899999999, "r_x3": 308.86197, "r_y3": 512.9632899999999, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.82483, "r_x1": 545.11505, "r_y1": 533.82483, "r_x2": 545.11505, "r_y2": 524.91827, "r_x3": 308.86197, "r_y3": 524.91827, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.77983, "r_x1": 420.94119, "r_y1": 545.77983, "r_x2": 420.94119, "r_y2": 536.87328, "r_x3": 308.86197, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59497, "r_y0": 545.56065, "r_x1": 433.5575600000001, "r_y1": 545.56065, "r_x2": 433.5575600000001, "r_y2": 536.1559599999999, "r_x3": 423.59497, "r_y3": 536.1559599999999, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21198, "r_y0": 545.77983, "r_x1": 545.11316, "r_y1": 545.77983, "r_x2": 545.11316, "r_y2": 536.87328, "r_x3": 436.21198, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 557.73483, "r_x1": 545.11511, "r_y1": 557.73483, "r_x2": 545.11511, "r_y2": 548.82828, "r_x3": 308.86197, "r_y3": 548.82828, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 569.68983, "r_x1": 545.11493, "r_y1": 569.68983, "r_x2": 545.11493, "r_y2": 560.78328, "r_x3": 308.86197, "r_y3": 560.78328, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 581.6448399999999, "r_x1": 545.11499, "r_y1": 581.6448399999999, "r_x2": 545.11499, "r_y2": 572.73828, "r_x3": 308.86197, "r_y3": 572.73828, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 593.60083, "r_x1": 545.11505, "r_y1": 593.60083, "r_x2": 545.11505, "r_y2": 584.69427, "r_x3": 308.86197, "r_y3": 584.69427, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 605.55583, "r_x1": 497.07541, "r_y1": 605.55583, "r_x2": 497.07541, "r_y2": 596.6492800000001, "r_x3": 308.86197, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.80496, "r_y0": 605.33665, "r_x1": 509.76755, "r_y1": 605.33665, "r_x2": 509.76755, "r_y2": 595.93196, "r_x3": 499.80496, "r_y3": 595.93196, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.50098, "r_y0": 605.55583, "r_x1": 545.10852, "r_y1": 605.55583, "r_x2": 545.10852, "r_y2": 596.6492800000001, "r_x3": 512.50098, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 617.5108299999999, "r_x1": 545.11511, "r_y1": 617.5108299999999, "r_x2": 545.11511, "r_y2": 608.60428, "r_x3": 308.86197, "r_y3": 608.60428, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.46584, "r_x1": 545.11505, "r_y1": 629.46584, "r_x2": 545.11505, "r_y2": 620.55928, "r_x3": 308.86197, "r_y3": 620.55928, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.42084, "r_x1": 364.78201, "r_y1": 641.42084, "r_x2": 364.78201, "r_y2": 632.51428, "r_x3": 308.86197, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57397, "r_y0": 641.1917, "r_x1": 415.61362, "r_y1": 641.1917, "r_x2": 415.61362, "r_y2": 632.60394, "r_x3": 367.57397, "r_y3": 632.60394, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61298, "r_y0": 641.42084, "r_x1": 545.11688, "r_y1": 641.42084, "r_x2": 545.11688, "r_y2": 632.51428, "r_x3": 415.61298, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.37584, "r_x1": 545.11511, "r_y1": 653.37584, "r_x2": 545.11511, "r_y2": 644.46928, "r_x3": 308.86197, "r_y3": 644.46928, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 665.1027, "r_x1": 373.59894, "r_y1": 665.1027, "r_x2": 373.59894, "r_y2": 656.51494, "r_x3": 308.86197, "r_y3": 656.51494, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.90698, "r_y0": 665.33184, "r_x1": 545.11548, "r_y1": 665.33184, "r_x2": 545.11548, "r_y2": 656.4252799999999, "r_x3": 376.90698, "r_y3": 656.4252799999999, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28684, "r_x1": 545.11517, "r_y1": 677.28684, "r_x2": 545.11517, "r_y2": 668.38028, "r_x3": 308.862, "r_y3": 668.38028, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.0127, "r_x1": 356.90164, "r_y1": 689.0127, "r_x2": 356.90164, "r_y2": 680.42494, "r_x3": 308.862, "r_y3": 680.42494, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13101, "r_y0": 689.24184, "r_x1": 545.1153, "r_y1": 689.24184, "r_x2": 545.1153, "r_y2": 680.33528, "r_x3": 357.13101, "r_y3": 680.33528, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196846, "r_x1": 545.11511, "r_y1": 701.196846, "r_x2": 545.11511, "r_y2": 692.290283, "r_x3": 308.862, "r_y3": 692.290283, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151848, "r_x1": 545.11517, "r_y1": 713.151848, "r_x2": 545.11517, "r_y2": 704.245285, "r_x3": 308.862, "r_y3": 704.245285, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the" }, { "label": "page_footer", "id": 15, "page_no": 1, "cluster": { "id": 15, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133282, "r": 300.10229, "b": 743.039845, "coord_origin": "TOPLEFT" }, "confidence": 0.8778094053268433, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039845, "r_x1": 300.10229, "r_y1": 743.039845, "r_x2": 300.10229, "r_y2": 734.133282, "r_x3": 295.121, "r_y3": 734.133282, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" } ], "body": [ { "label": "text", "id": 12, "page_no": 1, "cluster": { "id": 12, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36505, "b": 96.06994999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9656890034675598, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36505, "r_y1": 84.11492999999996, "r_x2": 286.36505, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 112.64721999999999, "r_y1": 96.06994999999995, "r_x2": 112.64721999999999, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "considered as a solved problem, given enough ground-truth data to train on." }, { "label": "text", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 99.57141000000001, "r": 286.36514, "b": 228.03008999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9838606119155884, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 108.47797000000003, "r_x1": 286.36496, "r_y1": 108.47797000000003, "r_x2": 286.36496, "r_y2": 99.57141000000001, "r_x3": 62.067001, "r_y3": 99.57141000000001, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.43297999999993, "r_x1": 74.749512, "r_y1": 120.43297999999993, "r_x2": 74.749512, "r_y2": 111.52643, "r_x3": 50.112, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.334793, "r_y0": 120.43297999999993, "r_x1": 286.36514, "r_y1": 120.43297999999993, "r_x2": 286.36514, "r_y2": 111.52643, "r_x3": 81.334793, "r_y3": 111.52643, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 132.38800000000003, "r_x1": 286.36511, "r_y1": 132.38800000000003, "r_x2": 286.36511, "r_y2": 123.48145, "r_x3": 50.112, "r_y3": 123.48145, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 144.34302000000002, "r_x1": 286.36511, "r_y1": 144.34302000000002, "r_x2": 286.36511, "r_y2": 135.43646, "r_x3": 50.112, "r_y3": 135.43646, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 156.29900999999995, "r_x1": 286.36505, "r_y1": 156.29900999999995, "r_x2": 286.36505, "r_y2": 147.39246000000003, "r_x3": 50.112, "r_y3": 147.39246000000003, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 168.25402999999994, "r_x1": 286.36511, "r_y1": 168.25402999999994, "r_x2": 286.36511, "r_y2": 159.34747000000004, "r_x3": 50.112, "r_y3": 159.34747000000004, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.20905000000005, "r_x1": 286.36508, "r_y1": 180.20905000000005, "r_x2": 286.36508, "r_y2": 171.30249000000003, "r_x3": 50.112, "r_y3": 171.30249000000003, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.16405999999995, "r_x1": 286.36511, "r_y1": 192.16405999999995, "r_x2": 286.36511, "r_y2": 183.25751000000002, "r_x3": 50.112, "r_y3": 183.25751000000002, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.11908000000005, "r_x1": 286.36508, "r_y1": 204.11908000000005, "r_x2": 286.36508, "r_y2": 195.21252000000004, "r_x3": 50.112, "r_y3": 195.21252000000004, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.07410000000004, "r_x1": 286.36514, "r_y1": 216.07410000000004, "r_x2": 286.36514, "r_y2": 207.16754000000003, "r_x3": 50.112, "r_y3": 207.16754000000003, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.03008999999997, "r_x1": 278.66397, "r_y1": 228.03008999999997, "r_x2": 278.66397, "r_y2": 219.12354000000005, "r_x3": 50.112, "r_y3": 219.12354000000005, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image." }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.112, "t": 231.53156, "r": 286.36511, "b": 371.94507, "coord_origin": "TOPLEFT" }, "confidence": 0.9855920076370239, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 240.43811000000005, "r_x1": 286.36493, "r_y1": 240.43811000000005, "r_x2": 286.36493, "r_y2": 231.53156, "r_x3": 62.067001, "r_y3": 231.53156, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 252.39313000000004, "r_x1": 286.36511, "r_y1": 252.39313000000004, "r_x2": 286.36511, "r_y2": 243.48657000000003, "r_x3": 50.112, "r_y3": 243.48657000000003, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.34813999999994, "r_x1": 286.36511, "r_y1": 264.34813999999994, "r_x2": 286.36511, "r_y2": 255.44159000000002, "r_x3": 50.112, "r_y3": 255.44159000000002, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.30316000000005, "r_x1": 286.36502, "r_y1": 276.30316000000005, "r_x2": 286.36502, "r_y2": 267.39661, "r_x3": 50.112, "r_y3": 267.39661, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.25815, "r_x1": 286.36508, "r_y1": 288.25815, "r_x2": 286.36508, "r_y2": 279.35155999999995, "r_x3": 50.112, "r_y3": 279.35155999999995, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.21414, "r_x1": 88.567635, "r_y1": 300.21414, "r_x2": 88.567635, "r_y2": 291.30759, "r_x3": 50.112, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.501602, "r_y0": 300.21414, "r_x1": 286.36505, "r_y1": 300.21414, "r_x2": 286.36505, "r_y2": 291.30759, "r_x3": 95.501602, "r_y3": 291.30759, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.16913, "r_x1": 286.36508, "r_y1": 312.16913, "r_x2": 286.36508, "r_y2": 303.26257, "r_x3": 50.112, "r_y3": 303.26257, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.12411, "r_x1": 286.36511, "r_y1": 324.12411, "r_x2": 286.36511, "r_y2": 315.21756, "r_x3": 50.112, "r_y3": 315.21756, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.0791, "r_x1": 286.36505, "r_y1": 336.0791, "r_x2": 286.36505, "r_y2": 327.17255, "r_x3": 50.112, "r_y3": 327.17255, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.03409, "r_x1": 286.36511, "r_y1": 348.03409, "r_x2": 286.36511, "r_y2": 339.12753, "r_x3": 50.112, "r_y3": 339.12753, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.99008, "r_x1": 286.36508, "r_y1": 359.99008, "r_x2": 286.36508, "r_y2": 351.08353, "r_x3": 50.112, "r_y3": 351.08353, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.94507, "r_x1": 76.951241, "r_y1": 371.94507, "r_x2": 76.951241, "r_y2": 363.03851, "r_x3": 50.112, "r_y3": 363.03851, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image." }, { "label": "text", "id": 7, "page_no": 1, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.112, "t": 375.4465, "r": 286.36658, "b": 432.173, "coord_origin": "TOPLEFT" }, "confidence": 0.9820111393928528, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 384.35306, "r_x1": 286.36499, "r_y1": 384.35306, "r_x2": 286.36499, "r_y2": 375.4465, "r_x3": 62.067001, "r_y3": 375.4465, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.30804, "r_x1": 120.98594, "r_y1": 396.30804, "r_x2": 120.98594, "r_y2": 387.40149, "r_x3": 50.112, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.901, "r_y0": 396.23830999999996, "r_x1": 179.7314, "r_y1": 396.23830999999996, "r_x2": 179.7314, "r_y2": 387.28192, "r_x3": 123.901, "r_y3": 387.28192, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.646, "r_y0": 396.30804, "r_x1": 286.36658, "r_y1": 396.30804, "r_x2": 286.36658, "r_y2": 387.40149, "r_x3": 182.646, "r_y3": 387.40149, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 408.26302999999996, "r_x1": 181.75778, "r_y1": 408.26302999999996, "r_x2": 181.75778, "r_y2": 399.35648, "r_x3": 50.112, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.104, "r_y0": 408.1933, "r_x1": 240.2034, "r_y1": 408.1933, "r_x2": 240.2034, "r_y2": 399.23690999999997, "r_x3": 184.104, "r_y3": 399.23690999999997, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.20401, "r_y0": 408.26302999999996, "r_x1": 286.36069, "r_y1": 408.26302999999996, "r_x2": 286.36069, "r_y2": 399.35648, "r_x3": 240.20401, "r_y3": 399.35648, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 420.21802, "r_x1": 286.36511, "r_y1": 420.21802, "r_x2": 286.36511, "r_y2": 411.31146, "r_x3": 50.112015, "r_y3": 411.31146, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 432.173, "r_x1": 82.520355, "r_y1": 432.173, "r_x2": 82.520355, "r_y2": 423.26645, "r_x3": 50.112015, "r_y3": 423.26645, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:" }, { "label": "list_item", "id": 6, "page_no": 1, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 61.569016, "t": 444.43188, "r": 286.3649, "b": 489.32297, "coord_origin": "TOPLEFT" }, "confidence": 0.9822162389755249, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 453.45801, "r_x1": 70.741714, "r_y1": 453.45801, "r_x2": 70.741714, "r_y2": 444.55145, "r_x3": 61.569016, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.034889, "r_y0": 453.45801, "r_x1": 117.10054, "r_y1": 453.45801, "r_x2": 117.10054, "r_y2": 444.55145, "r_x3": 73.034889, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59001, "r_y0": 453.38828, "r_x1": 175.42041, "r_y1": 453.38828, "r_x2": 175.42041, "r_y2": 444.43188, "r_x3": 119.59001, "r_y3": 444.43188, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42102, "r_y0": 453.45801, "r_x1": 286.36453, "r_y1": 453.45801, "r_x2": 286.36453, "r_y2": 444.55145, "r_x3": 175.42102, "r_y3": 444.55145, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 465.41299, "r_x1": 286.3649, "r_y1": 465.41299, "r_x2": 286.3649, "r_y2": 456.50644000000005, "r_x3": 70.037018, "r_y3": 456.50644000000005, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 477.36798, "r_x1": 286.3649, "r_y1": 477.36798, "r_x2": 286.3649, "r_y2": 468.46143, "r_x3": 70.037018, "r_y3": 468.46143, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037018, "r_y0": 489.32297, "r_x1": 99.635902, "r_y1": 489.32297, "r_x2": 99.635902, "r_y2": 480.41641, "r_x3": 70.037018, "r_y3": 480.41641, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach." }, { "label": "list_item", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 61.569016, "t": 502.03384, "r": 286.3649, "b": 546.9259500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.982271671295166, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569016, "r_y0": 511.05997, "r_x1": 71.619438, "r_y1": 511.05997, "r_x2": 71.619438, "r_y2": 502.15341, "r_x3": 61.569016, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.132042, "r_y0": 511.05997, "r_x1": 196.10396, "r_y1": 511.05997, "r_x2": 196.10396, "r_y2": 502.15341, "r_x3": 74.132042, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31001, "r_y0": 510.99023, "r_x1": 256.14041, "r_y1": 510.99023, "r_x2": 256.14041, "r_y2": 502.03384, "r_x3": 200.31001, "r_y3": 502.03384, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35001, "r_y0": 511.05997, "r_x1": 286.36237, "r_y1": 511.05997, "r_x2": 286.36237, "r_y2": 502.15341, "r_x3": 260.35001, "r_y3": 502.15341, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 523.01495, "r_x1": 286.3649, "r_y1": 523.01495, "r_x2": 286.3649, "r_y2": 514.1084000000001, "r_x3": 70.037003, "r_y3": 514.1084000000001, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 534.97095, "r_x1": 286.36487, "r_y1": 534.97095, "r_x2": 286.36487, "r_y2": 526.06439, "r_x3": 70.037003, "r_y3": 526.06439, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 546.9259500000001, "r_x1": 161.65305, "r_y1": 546.9259500000001, "r_x2": 161.65305, "r_y2": 538.0193899999999, "r_x3": 70.037003, "r_y3": 538.0193899999999, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works." }, { "label": "list_item", "id": 9, "page_no": 1, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 61.569, "t": 559.63684, "r": 286.36493, "b": 592.57295, "coord_origin": "TOPLEFT" }, "confidence": 0.9802963733673096, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 568.66295, "r_x1": 71.115913, "r_y1": 568.66295, "r_x2": 71.115913, "r_y2": 559.75639, "r_x3": 61.569, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.502647, "r_y0": 568.66295, "r_x1": 116.71199, "r_y1": 568.66295, "r_x2": 116.71199, "r_y2": 559.75639, "r_x3": 73.502647, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.583, "r_y0": 568.59322, "r_x1": 177.68239, "r_y1": 568.59322, "r_x2": 177.68239, "r_y2": 559.63684, "r_x3": 121.583, "r_y3": 559.63684, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55301, "r_y0": 568.66295, "r_x1": 286.36328, "r_y1": 568.66295, "r_x2": 286.36328, "r_y2": 559.75639, "r_x3": 182.55301, "r_y3": 559.75639, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 580.6179500000001, "r_x1": 286.36493, "r_y1": 580.6179500000001, "r_x2": 286.36493, "r_y2": 571.7114, "r_x3": 70.03701, "r_y3": 571.7114, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 592.57295, "r_x1": 82.400597, "r_y1": 592.57295, "r_x2": 82.400597, "r_y2": 583.6664000000001, "r_x3": 70.03701, "r_y3": 583.6664000000001, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity." }, { "label": "list_item", "id": 8, "page_no": 1, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 61.569008000000004, "t": 605.4034, "r": 286.36508, "b": 638.22095, "coord_origin": "TOPLEFT" }, "confidence": 0.9806395173072815, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569008000000004, "r_y0": 614.30995, "r_x1": 72.332527, "r_y1": 614.30995, "r_x2": 72.332527, "r_y2": 605.4034, "r_x3": 61.569008000000004, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.023399, "r_y0": 614.30995, "r_x1": 286.36508, "r_y1": 614.30995, "r_x2": 286.36508, "r_y2": 605.4034, "r_x3": 75.023399, "r_y3": 605.4034, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 626.26495, "r_x1": 286.36487, "r_y1": 626.26495, "r_x2": 286.36487, "r_y2": 617.3584, "r_x3": 70.03701, "r_y3": 617.3584, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03701, "r_y0": 638.22095, "r_x1": 198.05641, "r_y1": 638.22095, "r_x2": 198.05641, "r_y2": 629.31439, "r_x3": 70.03701, "r_y3": 629.31439, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility." }, { "label": "text", "id": 11, "page_no": 1, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.112007, "t": 650.59839, "r": 286.36511, "b": 695.369957, "coord_origin": "TOPLEFT" }, "confidence": 0.9742533564567566, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067009000000006, "r_y0": 659.50494, "r_x1": 286.36496, "r_y1": 659.50494, "r_x2": 286.36496, "r_y2": 650.59839, "r_x3": 62.067009000000006, "r_y3": 650.59839, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 671.45995, "r_x1": 286.36511, "r_y1": 671.45995, "r_x2": 286.36511, "r_y2": 662.55339, "r_x3": 50.112007, "r_y3": 662.55339, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 683.41496, "r_x1": 286.36511, "r_y1": 683.41496, "r_x2": 286.36511, "r_y2": 674.50839, "r_x3": 50.112007, "r_y3": 674.50839, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 695.369957, "r_x1": 286.36511, "r_y1": 695.369957, "r_x2": 286.36511, "r_y2": 686.46339, "r_x3": 50.112007, "r_y3": 686.46339, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe" }, { "label": "footnote", "id": 14, "page_no": 1, "cluster": { "id": 14, "label": "footnote", "bbox": { "l": 60.97100100000001, "t": 705.596275, "r": 183.73055, "b": 712.721542, "coord_origin": "TOPLEFT" }, "confidence": 0.895367443561554, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97100100000001, "r_y0": 712.721542, "r_x1": 183.73055, "r_y1": 712.721542, "r_x2": 183.73055, "r_y2": 705.596275, "r_x3": 60.97100100000001, "r_y3": 705.596275, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "$^{1}$https://github.com/IBM/SynthTabNet" }, { "label": "text", "id": 10, "page_no": 1, "cluster": { "id": 10, "label": "text", "bbox": { "l": 308.862, "t": 75.20836999999995, "r": 545.11511, "b": 108.02495999999985, "coord_origin": "TOPLEFT" }, "confidence": 0.9774322509765625, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 545.11511, "r_y1": 84.11492999999996, "r_x2": 545.11511, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11505, "r_y1": 96.06994999999995, "r_x2": 545.11505, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 508.08417000000003, "r_y1": 108.02495999999985, "r_x2": 508.08417000000003, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community." }, { "label": "section_header", "id": 13, "page_no": 1, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 308.862, "t": 121.73193000000003, "r": 498.28021, "b": 132.47968000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9428724646568298, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 132.47968000000003, "r_x1": 315.5831, "r_y1": 132.47968000000003, "r_x2": 315.5831, "r_y2": 121.73193000000003, "r_x3": 308.862, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54456, "r_y0": 132.47968000000003, "r_x1": 498.28021, "r_y1": 132.47968000000003, "r_x2": 498.28021, "r_y2": 121.73193000000003, "r_x3": 324.54456, "r_y3": 121.73193000000003, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Previous work and State of the Art" }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 142.22136999999998, "r": 545.11517, "b": 330.45502, "coord_origin": "TOPLEFT" }, "confidence": 0.987194836139679, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 151.12793, "r_x1": 545.11493, "r_y1": 151.12793, "r_x2": 545.11493, "r_y2": 142.22136999999998, "r_x3": 320.81699, "r_y3": 142.22136999999998, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 163.08294999999998, "r_x1": 545.11505, "r_y1": 163.08294999999998, "r_x2": 545.11505, "r_y2": 154.17638999999997, "r_x3": 308.862, "r_y3": 154.17638999999997, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 175.03796, "r_x1": 522.55975, "r_y1": 175.03796, "r_x2": 522.55975, "r_y2": 166.13140999999996, "r_x3": 308.862, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 175.03796, "r_x1": 545.11505, "r_y1": 175.03796, "r_x2": 545.11505, "r_y2": 166.13140999999996, "r_x3": 529.62323, "r_y3": 166.13140999999996, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 186.99298, "r_x1": 545.11517, "r_y1": 186.99298, "r_x2": 545.11517, "r_y2": 178.08642999999995, "r_x3": 308.862, "r_y3": 178.08642999999995, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 198.94799999999998, "r_x1": 545.11511, "r_y1": 198.94799999999998, "r_x2": 545.11511, "r_y2": 190.04143999999997, "r_x3": 308.862, "r_y3": 190.04143999999997, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 210.90301999999997, "r_x1": 346.97891, "r_y1": 210.90301999999997, "r_x2": 346.97891, "r_y2": 201.99645999999996, "r_x3": 308.862, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.86929, "r_y0": 210.90301999999997, "r_x1": 545.11511, "r_y1": 210.90301999999997, "r_x2": 545.11511, "r_y2": 201.99645999999996, "r_x3": 354.86929, "r_y3": 201.99645999999996, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 222.85901, "r_x1": 545.11505, "r_y1": 222.85901, "r_x2": 545.11505, "r_y2": 213.95245, "r_x3": 308.862, "r_y3": 213.95245, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 234.81403, "r_x1": 530.9184, "r_y1": 234.81403, "r_x2": 530.9184, "r_y2": 225.90747, "r_x3": 308.862, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92212, "r_y0": 234.81403, "r_x1": 545.11511, "r_y1": 234.81403, "r_x2": 545.11511, "r_y2": 225.90747, "r_x3": 537.92212, "r_y3": 225.90747, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 246.76904000000002, "r_x1": 545.11517, "r_y1": 246.76904000000002, "r_x2": 545.11517, "r_y2": 237.86248999999998, "r_x3": 308.862, "r_y3": 237.86248999999998, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.72406, "r_x1": 545.11511, "r_y1": 258.72406, "r_x2": 545.11511, "r_y2": 249.8175, "r_x3": 308.862, "r_y3": 249.8175, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.67908, "r_x1": 439.8402699999999, "r_y1": 270.67908, "r_x2": 439.8402699999999, "r_y2": 261.77252, "r_x3": 308.862, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.43999999999994, "r_y0": 270.45989999999995, "r_x1": 452.1889, "r_y1": 270.45989999999995, "r_x2": 452.1889, "r_y2": 261.61310000000003, "r_x3": 444.43999999999994, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89001, "r_y0": 270.45989999999995, "r_x1": 470.83392000000003, "r_y1": 270.45989999999995, "r_x2": 470.83392000000003, "r_y2": 261.61310000000003, "r_x3": 455.89001, "r_y3": 261.61310000000003, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83401, "r_y0": 270.67908, "r_x1": 545.11517, "r_y1": 270.67908, "r_x2": 545.11517, "r_y2": 261.77252, "r_x3": 470.83401, "r_y3": 261.77252, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.63406, "r_x1": 545.11511, "r_y1": 282.63406, "r_x2": 545.11511, "r_y2": 273.72748, "r_x3": 308.862, "r_y3": 273.72748, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.59006, "r_x1": 545.11511, "r_y1": 294.59006, "r_x2": 545.11511, "r_y2": 285.6835, "r_x3": 308.862, "r_y3": 285.6835, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 306.54504, "r_x1": 545.11511, "r_y1": 306.54504, "r_x2": 545.11511, "r_y2": 297.63849, "r_x3": 308.862, "r_y3": 297.63849, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 318.50003000000004, "r_x1": 545.11517, "r_y1": 318.50003000000004, "r_x2": 545.11517, "r_y2": 309.59348, "r_x3": 308.862, "r_y3": 309.59348, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 330.45502, "r_x1": 425.92255, "r_y1": 330.45502, "r_x2": 425.92255, "r_y2": 321.54846, "r_x3": 308.862, "r_y3": 321.54846, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc." }, { "label": "text", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.862, "t": 333.56946, "r": 545.11523, "b": 450.0729099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9869040250778198, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 342.47601, "r_x1": 545.11499, "r_y1": 342.47601, "r_x2": 545.11499, "r_y2": 333.56946, "r_x3": 320.81699, "r_y3": 333.56946, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 354.43100000000004, "r_x1": 545.11499, "r_y1": 354.43100000000004, "r_x2": 545.11499, "r_y2": 345.52444, "r_x3": 308.862, "r_y3": 345.52444, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 366.38599, "r_x1": 545.11517, "r_y1": 366.38599, "r_x2": 545.11517, "r_y2": 357.47943, "r_x3": 308.862, "r_y3": 357.47943, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 378.34198, "r_x1": 545.11511, "r_y1": 378.34198, "r_x2": 545.11511, "r_y2": 369.43542, "r_x3": 308.862, "r_y3": 369.43542, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 390.29697, "r_x1": 545.11505, "r_y1": 390.29697, "r_x2": 545.11505, "r_y2": 381.39041, "r_x3": 308.862, "r_y3": 381.39041, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 402.25195, "r_x1": 545.11505, "r_y1": 402.25195, "r_x2": 545.11505, "r_y2": 393.3453999999999, "r_x3": 308.862, "r_y3": 393.3453999999999, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 414.20694, "r_x1": 545.11517, "r_y1": 414.20694, "r_x2": 545.11517, "r_y2": 405.30038, "r_x3": 308.862, "r_y3": 405.30038, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 426.16193, "r_x1": 545.11523, "r_y1": 426.16193, "r_x2": 545.11523, "r_y2": 417.25537, "r_x3": 308.862, "r_y3": 417.25537, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 438.11792, "r_x1": 545.11511, "r_y1": 438.11792, "r_x2": 545.11511, "r_y2": 429.21136000000007, "r_x3": 308.862, "r_y3": 429.21136000000007, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 450.0729099999999, "r_x1": 401.28503, "r_y1": 450.0729099999999, "r_x2": 401.28503, "r_y2": 441.16635, "r_x3": 308.862, "r_y3": 441.16635, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification." }, { "label": "text", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86197, "t": 453.06778, "r": 545.11688, "b": 713.151848, "coord_origin": "TOPLEFT" }, "confidence": 0.9843218326568604, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 462.02417, "r_x1": 423.26236, "r_y1": 462.02417, "r_x2": 423.26236, "r_y2": 453.06778, "r_x3": 320.81699, "r_y3": 453.06778, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.26697, "r_y0": 462.0939, "r_x1": 545.10956, "r_y1": 462.0939, "r_x2": 545.10956, "r_y2": 453.18735, "r_x3": 423.26697, "r_y3": 453.18735, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 474.04889, "r_x1": 545.11511, "r_y1": 474.04889, "r_x2": 545.11511, "r_y2": 465.14233, "r_x3": 308.86197, "r_y3": 465.14233, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 486.00388, "r_x1": 335.7012, "r_y1": 486.00388, "r_x2": 335.7012, "r_y2": 477.09732, "r_x3": 308.86197, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85309, "r_y0": 486.00388, "r_x1": 545.11505, "r_y1": 486.00388, "r_x2": 545.11505, "r_y2": 477.09732, "r_x3": 345.85309, "r_y3": 477.09732, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.95886, "r_x1": 545.11493, "r_y1": 497.95886, "r_x2": 545.11493, "r_y2": 489.05231, "r_x3": 308.86197, "r_y3": 489.05231, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.91385, "r_x1": 545.11499, "r_y1": 509.91385, "r_x2": 545.11499, "r_y2": 501.00729, "r_x3": 308.86197, "r_y3": 501.00729, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.8698400000001, "r_x1": 545.11505, "r_y1": 521.8698400000001, "r_x2": 545.11505, "r_y2": 512.9632899999999, "r_x3": 308.86197, "r_y3": 512.9632899999999, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.82483, "r_x1": 545.11505, "r_y1": 533.82483, "r_x2": 545.11505, "r_y2": 524.91827, "r_x3": 308.86197, "r_y3": 524.91827, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.77983, "r_x1": 420.94119, "r_y1": 545.77983, "r_x2": 420.94119, "r_y2": 536.87328, "r_x3": 308.86197, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59497, "r_y0": 545.56065, "r_x1": 433.5575600000001, "r_y1": 545.56065, "r_x2": 433.5575600000001, "r_y2": 536.1559599999999, "r_x3": 423.59497, "r_y3": 536.1559599999999, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21198, "r_y0": 545.77983, "r_x1": 545.11316, "r_y1": 545.77983, "r_x2": 545.11316, "r_y2": 536.87328, "r_x3": 436.21198, "r_y3": 536.87328, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 557.73483, "r_x1": 545.11511, "r_y1": 557.73483, "r_x2": 545.11511, "r_y2": 548.82828, "r_x3": 308.86197, "r_y3": 548.82828, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 569.68983, "r_x1": 545.11493, "r_y1": 569.68983, "r_x2": 545.11493, "r_y2": 560.78328, "r_x3": 308.86197, "r_y3": 560.78328, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 581.6448399999999, "r_x1": 545.11499, "r_y1": 581.6448399999999, "r_x2": 545.11499, "r_y2": 572.73828, "r_x3": 308.86197, "r_y3": 572.73828, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 593.60083, "r_x1": 545.11505, "r_y1": 593.60083, "r_x2": 545.11505, "r_y2": 584.69427, "r_x3": 308.86197, "r_y3": 584.69427, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 605.55583, "r_x1": 497.07541, "r_y1": 605.55583, "r_x2": 497.07541, "r_y2": 596.6492800000001, "r_x3": 308.86197, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.80496, "r_y0": 605.33665, "r_x1": 509.76755, "r_y1": 605.33665, "r_x2": 509.76755, "r_y2": 595.93196, "r_x3": 499.80496, "r_y3": 595.93196, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.50098, "r_y0": 605.55583, "r_x1": 545.10852, "r_y1": 605.55583, "r_x2": 545.10852, "r_y2": 596.6492800000001, "r_x3": 512.50098, "r_y3": 596.6492800000001, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 617.5108299999999, "r_x1": 545.11511, "r_y1": 617.5108299999999, "r_x2": 545.11511, "r_y2": 608.60428, "r_x3": 308.86197, "r_y3": 608.60428, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.46584, "r_x1": 545.11505, "r_y1": 629.46584, "r_x2": 545.11505, "r_y2": 620.55928, "r_x3": 308.86197, "r_y3": 620.55928, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.42084, "r_x1": 364.78201, "r_y1": 641.42084, "r_x2": 364.78201, "r_y2": 632.51428, "r_x3": 308.86197, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57397, "r_y0": 641.1917, "r_x1": 415.61362, "r_y1": 641.1917, "r_x2": 415.61362, "r_y2": 632.60394, "r_x3": 367.57397, "r_y3": 632.60394, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61298, "r_y0": 641.42084, "r_x1": 545.11688, "r_y1": 641.42084, "r_x2": 545.11688, "r_y2": 632.51428, "r_x3": 415.61298, "r_y3": 632.51428, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.37584, "r_x1": 545.11511, "r_y1": 653.37584, "r_x2": 545.11511, "r_y2": 644.46928, "r_x3": 308.86197, "r_y3": 644.46928, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 665.1027, "r_x1": 373.59894, "r_y1": 665.1027, "r_x2": 373.59894, "r_y2": 656.51494, "r_x3": 308.86197, "r_y3": 656.51494, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.90698, "r_y0": 665.33184, "r_x1": 545.11548, "r_y1": 665.33184, "r_x2": 545.11548, "r_y2": 656.4252799999999, "r_x3": 376.90698, "r_y3": 656.4252799999999, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28684, "r_x1": 545.11517, "r_y1": 677.28684, "r_x2": 545.11517, "r_y2": 668.38028, "r_x3": 308.862, "r_y3": 668.38028, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.0127, "r_x1": 356.90164, "r_y1": 689.0127, "r_x2": 356.90164, "r_y2": 680.42494, "r_x3": 308.862, "r_y3": 680.42494, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13101, "r_y0": 689.24184, "r_x1": 545.1153, "r_y1": 689.24184, "r_x2": 545.1153, "r_y2": 680.33528, "r_x3": 357.13101, "r_y3": 680.33528, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196846, "r_x1": 545.11511, "r_y1": 701.196846, "r_x2": 545.11511, "r_y2": 692.290283, "r_x3": 308.862, "r_y3": 692.290283, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151848, "r_x1": 545.11517, "r_y1": 713.151848, "r_x2": 545.11517, "r_y2": 704.245285, "r_x3": 308.862, "r_y3": 704.245285, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the" } ], "headers": [ { "label": "page_footer", "id": 15, "page_no": 1, "cluster": { "id": 15, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133282, "r": 300.10229, "b": 743.039845, "coord_origin": "TOPLEFT" }, "confidence": 0.8778094053268433, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039845, "r_x1": 300.10229, "r_y1": 743.039845, "r_x2": 300.10229, "r_y2": 734.133282, "r_x3": 295.121, "r_y3": 734.133282, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" } ] } }, { "page_no": 2, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 250.15102, "r_y1": 84.11492999999996, "r_x2": 250.15102, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.12591999999995, "r_x1": 70.365845, "r_y1": 96.12591999999995, "r_x2": 70.365845, "r_y2": 87.21935999999994, "r_x3": 62.067001, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.931198, "r_y0": 96.12591999999995, "r_x1": 110.95348000000001, "r_y1": 96.12591999999995, "r_x2": 110.95348000000001, "r_y2": 87.21935999999994, "r_x3": 76.931198, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54498, "r_y0": 96.12591999999995, "r_x1": 136.25848, "r_y1": 96.12591999999995, "r_x2": 136.25848, "r_y2": 87.21935999999994, "r_x3": 118.54498, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82384, "r_y0": 96.12591999999995, "r_x1": 175.37166, "r_y1": 96.12591999999995, "r_x2": 175.37166, "r_y2": 87.21935999999994, "r_x3": 142.82384, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.94698, "r_y0": 96.12591999999995, "r_x1": 232.83594000000002, "r_y1": 96.12591999999995, "r_x2": 232.83594000000002, "r_y2": 87.21935999999994, "r_x3": 181.94698, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41125, "r_y0": 96.12591999999995, "r_x1": 265.41364, "r_y1": 96.12591999999995, "r_x2": 265.41364, "r_y2": 87.21935999999994, "r_x3": 239.41125, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.979, "r_y0": 96.12591999999995, "r_x1": 286.36499, "r_y1": 96.12591999999995, "r_x2": 286.36499, "r_y2": 87.21935999999994, "r_x3": 271.979, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.08092999999997, "r_x1": 286.36505, "r_y1": 108.08092999999997, "r_x2": 286.36505, "r_y2": 99.17437999999993, "r_x3": 50.112, "r_y3": 99.17437999999993, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.03692999999998, "r_x1": 286.36511, "r_y1": 120.03692999999998, "r_x2": 286.36511, "r_y2": 111.13036999999997, "r_x3": 50.112, "r_y3": 111.13036999999997, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.99194, "r_x1": 286.36505, "r_y1": 131.99194, "r_x2": 286.36505, "r_y2": 123.08538999999996, "r_x3": 50.112, "r_y3": 123.08538999999996, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.94696, "r_x1": 286.36514, "r_y1": 143.94696, "r_x2": 286.36514, "r_y2": 135.04040999999995, "r_x3": 50.112, "r_y3": 135.04040999999995, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.90197999999998, "r_x1": 286.36511, "r_y1": 155.90197999999998, "r_x2": 286.36511, "r_y2": 146.99541999999997, "r_x3": 50.112, "r_y3": 146.99541999999997, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 167.85699, "r_x1": 286.36505, "r_y1": 167.85699, "r_x2": 286.36505, "r_y2": 158.95043999999996, "r_x3": 50.112, "r_y3": 158.95043999999996, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 179.81201, "r_x1": 286.36508, "r_y1": 179.81201, "r_x2": 286.36508, "r_y2": 170.90545999999995, "r_x3": 50.112, "r_y3": 170.90545999999995, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 191.76801, "r_x1": 286.36508, "r_y1": 191.76801, "r_x2": 286.36508, "r_y2": 182.86145, "r_x3": 50.112, "r_y3": 182.86145, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 203.72302000000002, "r_x1": 286.36511, "r_y1": 203.72302000000002, "r_x2": 286.36511, "r_y2": 194.81646999999998, "r_x3": 50.112, "r_y3": 194.81646999999998, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 215.67804, "r_x1": 286.36511, "r_y1": 215.67804, "r_x2": 286.36511, "r_y2": 206.77148, "r_x3": 50.112, "r_y3": 206.77148, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 227.63306, "r_x1": 286.36505, "r_y1": 227.63306, "r_x2": 286.36505, "r_y2": 218.7265, "r_x3": 50.112, "r_y3": 218.7265, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 239.58807000000002, "r_x1": 286.36505, "r_y1": 239.58807000000002, "r_x2": 286.36505, "r_y2": 230.68151999999998, "r_x3": 50.112, "r_y3": 230.68151999999998, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 251.54309, "r_x1": 286.36511, "r_y1": 251.54309, "r_x2": 286.36511, "r_y2": 242.63653999999997, "r_x3": 50.112, "r_y3": 242.63653999999997, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 263.49908000000005, "r_x1": 286.36508, "r_y1": 263.49908000000005, "r_x2": 286.36508, "r_y2": 254.59253, "r_x3": 50.112, "r_y3": 254.59253, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 275.45410000000004, "r_x1": 64.776947, "r_y1": 275.45410000000004, "r_x2": 64.776947, "r_y2": 266.54755, "r_x3": 50.112, "r_y3": 266.54755, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 287.39536, "r_x1": 171.56593, "r_y1": 287.39536, "r_x2": 171.56593, "r_y2": 278.43895999999995, "r_x3": 62.067001, "r_y3": 278.43895999999995, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.56799, "r_y0": 287.46509, "r_x1": 174.3376, "r_y1": 287.46509, "r_x2": 174.3376, "r_y2": 278.55853, "r_x3": 171.56799, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.18687, "r_y0": 287.46509, "r_x1": 286.35709, "r_y1": 287.46509, "r_x2": 286.35709, "r_y2": 278.55853, "r_x3": 185.18687, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 299.42108, "r_x1": 286.36511, "r_y1": 299.42108, "r_x2": 286.36511, "r_y2": 290.51453000000004, "r_x3": 50.111992, "r_y3": 290.51453000000004, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 311.37607, "r_x1": 131.16771, "r_y1": 311.37607, "r_x2": 131.16771, "r_y2": 302.46950999999996, "r_x3": 50.111992, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.84888, "r_y0": 311.37607, "r_x1": 286.36508, "r_y1": 311.37607, "r_x2": 286.36508, "r_y2": 302.46950999999996, "r_x3": 138.84888, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 323.33105, "r_x1": 286.36505, "r_y1": 323.33105, "r_x2": 286.36505, "r_y2": 314.4245, "r_x3": 50.111992, "r_y3": 314.4245, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 335.28604, "r_x1": 286.36508, "r_y1": 335.28604, "r_x2": 286.36508, "r_y2": 326.37949000000003, "r_x3": 50.111992, "r_y3": 326.37949000000003, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 347.2410300000001, "r_x1": 286.36505, "r_y1": 347.2410300000001, "r_x2": 286.36505, "r_y2": 338.33447, "r_x3": 50.111992, "r_y3": 338.33447, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 359.19601, "r_x1": 286.36505, "r_y1": 359.19601, "r_x2": 286.36505, "r_y2": 350.28946, "r_x3": 50.111992, "r_y3": 350.28946, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 371.15201, "r_x1": 286.36508, "r_y1": 371.15201, "r_x2": 286.36508, "r_y2": 362.24545000000006, "r_x3": 50.111992, "r_y3": 362.24545000000006, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 383.10699, "r_x1": 286.36508, "r_y1": 383.10699, "r_x2": 286.36508, "r_y2": 374.20044, "r_x3": 50.111992, "r_y3": 374.20044, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 395.06198, "r_x1": 286.36508, "r_y1": 395.06198, "r_x2": 286.36508, "r_y2": 386.15542999999997, "r_x3": 50.111992, "r_y3": 386.15542999999997, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 407.01697, "r_x1": 286.36508, "r_y1": 407.01697, "r_x2": 286.36508, "r_y2": 398.11041000000006, "r_x3": 50.111992, "r_y3": 398.11041000000006, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 418.97195, "r_x1": 286.36508, "r_y1": 418.97195, "r_x2": 286.36508, "r_y2": 410.0654, "r_x3": 50.111992, "r_y3": 410.0654, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 430.92694, "r_x1": 286.36505, "r_y1": 430.92694, "r_x2": 286.36505, "r_y2": 422.02038999999996, "r_x3": 50.111992, "r_y3": 422.02038999999996, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 442.88293, "r_x1": 198.2359, "r_y1": 442.88293, "r_x2": 198.2359, "r_y2": 433.97638, "r_x3": 50.111992, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.92703, "r_y0": 442.88293, "r_x1": 286.36505, "r_y1": 442.88293, "r_x2": 286.36505, "r_y2": 433.97638, "r_x3": 205.92703, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 454.83792000000005, "r_x1": 286.36508, "r_y1": 454.83792000000005, "r_x2": 286.36508, "r_y2": 445.93137, "r_x3": 50.111992, "r_y3": 445.93137, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 466.79291, "r_x1": 286.36505, "r_y1": 466.79291, "r_x2": 286.36505, "r_y2": 457.88635, "r_x3": 50.111992, "r_y3": 457.88635, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 478.74789, "r_x1": 286.36505, "r_y1": 478.74789, "r_x2": 286.36505, "r_y2": 469.84134, "r_x3": 50.111992, "r_y3": 469.84134, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 490.70288, "r_x1": 186.49998, "r_y1": 490.70288, "r_x2": 186.49998, "r_y2": 481.79633, "r_x3": 50.111992, "r_y3": 481.79633, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066994, "r_y0": 502.64514, "r_x1": 252.88068000000004, "r_y1": 502.64514, "r_x2": 252.88068000000004, "r_y2": 493.68875, "r_x3": 62.066994, "r_y3": 493.68875, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88199, "r_y0": 502.71487, "r_x1": 286.36627, "r_y1": 502.71487, "r_x2": 286.36627, "r_y2": 493.80832, "r_x3": 252.88199, "r_y3": 493.80832, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 514.66986, "r_x1": 286.36505, "r_y1": 514.66986, "r_x2": 286.36505, "r_y2": 505.76331, "r_x3": 50.111984, "r_y3": 505.76331, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 526.6248499999999, "r_x1": 286.36505, "r_y1": 526.6248499999999, "r_x2": 286.36505, "r_y2": 517.71829, "r_x3": 50.111984, "r_y3": 517.71829, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 538.57985, "r_x1": 286.36508, "r_y1": 538.57985, "r_x2": 286.36508, "r_y2": 529.67328, "r_x3": 50.111984, "r_y3": 529.67328, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 550.53584, "r_x1": 286.36508, "r_y1": 550.53584, "r_x2": 286.36508, "r_y2": 541.62929, "r_x3": 50.111984, "r_y3": 541.62929, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 562.4908399999999, "r_x1": 286.36511, "r_y1": 562.4908399999999, "r_x2": 286.36511, "r_y2": 553.58429, "r_x3": 50.111984, "r_y3": 553.58429, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 574.44585, "r_x1": 286.36511, "r_y1": 574.44585, "r_x2": 286.36511, "r_y2": 565.5392899999999, "r_x3": 50.111984, "r_y3": 565.5392899999999, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 586.40085, "r_x1": 286.36502, "r_y1": 586.40085, "r_x2": 286.36502, "r_y2": 577.49429, "r_x3": 50.111984, "r_y3": 577.49429, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 598.35585, "r_x1": 286.36505, "r_y1": 598.35585, "r_x2": 286.36505, "r_y2": 589.4493, "r_x3": 50.111984, "r_y3": 589.4493, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 610.31085, "r_x1": 286.36502, "r_y1": 610.31085, "r_x2": 286.36502, "r_y2": 601.4043, "r_x3": 50.111984, "r_y3": 601.4043, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 622.26685, "r_x1": 175.98943, "r_y1": 622.26685, "r_x2": 175.98943, "r_y2": 613.36029, "r_x3": 50.111984, "r_y3": 613.36029, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 646.6925699999999, "r_x1": 57.82375699999999, "r_y1": 646.6925699999999, "r_x2": 57.82375699999999, "r_y2": 635.94484, "r_x3": 50.111984, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.106125, "r_y0": 646.6925699999999, "r_x1": 105.22546, "r_y1": 646.6925699999999, "r_x2": 105.22546, "r_y2": 635.94484, "r_x3": 68.106125, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 665.33186, "r_x1": 286.36493, "r_y1": 665.33186, "r_x2": 286.36493, "r_y2": 656.42529, "r_x3": 62.06698600000001, "r_y3": 656.42529, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 677.2868599999999, "r_x1": 286.36508, "r_y1": 677.2868599999999, "r_x2": 286.36508, "r_y2": 668.38029, "r_x3": 50.111984, "r_y3": 668.38029, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 689.24186, "r_x1": 286.36502, "r_y1": 689.24186, "r_x2": 286.36502, "r_y2": 680.3353, "r_x3": 50.111984, "r_y3": 680.3353, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 701.196861, "r_x1": 166.24602, "r_y1": 701.196861, "r_x2": 166.24602, "r_y2": 692.290298, "r_x3": 50.111984, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.68808, "r_y0": 701.196861, "r_x1": 286.36508, "r_y1": 701.196861, "r_x2": 286.36508, "r_y2": 692.290298, "r_x3": 173.68808, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 713.151863, "r_x1": 286.36505, "r_y1": 713.151863, "r_x2": 286.36505, "r_y2": 704.2453, "r_x3": 50.111984, "r_y3": 704.2453, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.79849, "r_y0": 88.55975000000001, "r_x1": 486.84909, "r_y1": 88.55975000000001, "r_x2": 486.84909, "r_y2": 79.81176999999991, "r_x3": 380.79849, "r_y3": 79.81176999999991, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.76776, "r_y0": 250.77495999999996, "r_x1": 469.78748, "r_y1": 250.77495999999996, "r_x2": 469.78748, "r_y2": 242.02697999999998, "r_x3": 396.76776, "r_y3": 242.02697999999998, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.97653, "r_y0": 239.255, "r_x1": 324.79254, "r_y1": 239.255, "r_x2": 324.79254, "r_y2": 233.42296999999996, "r_x3": 320.97653, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.483, "r_y0": 239.255, "r_x1": 418.11319, "r_y1": 239.255, "r_x2": 418.11319, "r_y2": 233.42296999999996, "r_x3": 410.483, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.84949, "r_y0": 239.255, "r_x1": 508.47968000000003, "r_y1": 239.255, "r_x2": 508.47968000000003, "r_y2": 233.42296999999996, "r_x3": 500.84949, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.29999, "r_y0": 239.255, "r_x1": 372.93018, "r_y1": 239.255, "r_x2": 372.93018, "r_y2": 233.42296999999996, "r_x3": 365.29999, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.66626, "r_y0": 239.255, "r_x1": 463.29645, "r_y1": 239.255, "r_x2": 463.29645, "r_y2": 233.42296999999996, "r_x3": 455.66626, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.03528, "r_y0": 239.255, "r_x1": 549.66547, "r_y1": 239.255, "r_x2": 549.66547, "r_y2": 233.42296999999996, "r_x3": 542.03528, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04474, "r_y0": 236.27819999999997, "r_x1": 319.86075, "r_y1": 236.27819999999997, "r_x2": 319.86075, "r_y2": 230.44617000000005, "r_x3": 316.04474, "r_y3": 230.44617000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.62521, "r_y0": 204.52277000000004, "r_x1": 316.44122, "r_y1": 204.52277000000004, "r_x2": 316.44122, "r_y2": 198.69073000000003, "r_x3": 312.62521, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.43942, "r_y0": 204.52277000000004, "r_x1": 320.2554, "r_y1": 204.52277000000004, "r_x2": 320.2554, "r_y2": 198.69073000000003, "r_x3": 316.43942, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.14951, "r_y0": 173.92998999999998, "r_x1": 316.96552, "r_y1": 173.92998999999998, "r_x2": 316.96552, "r_y2": 168.09795999999994, "r_x3": 313.14951, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96371, "r_y0": 173.92998999999998, "r_x1": 320.77969, "r_y1": 173.92998999999998, "r_x2": 320.77969, "r_y2": 168.09795999999994, "r_x3": 316.96371, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.92972, "r_y0": 142.41974000000005, "r_x1": 316.74573, "r_y1": 142.41974000000005, "r_x2": 316.74573, "r_y2": 136.58771000000002, "r_x3": 312.92972, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74393, "r_y0": 142.41974000000005, "r_x1": 320.55991, "r_y1": 142.41974000000005, "r_x2": 320.55991, "r_y2": 136.58771000000002, "r_x3": 316.74393, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 111.43377999999996, "r_x1": 316.29828, "r_y1": 111.43377999999996, "r_x2": 316.29828, "r_y2": 105.60175000000004, "r_x3": 312.48227, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 111.43377999999996, "r_x1": 320.11246, "r_y1": 111.43377999999996, "r_x2": 320.11246, "r_y2": 105.60175000000004, "r_x3": 316.29648, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 218.09124999999995, "r_x1": 316.29828, "r_y1": 218.09124999999995, "r_x2": 316.29828, "r_y2": 212.25922000000003, "r_x3": 312.48227, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 218.09124999999995, "r_x1": 320.11246, "r_y1": 218.09124999999995, "r_x2": 320.11246, "r_y2": 212.25922000000003, "r_x3": 316.29648, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.07639, "r_y0": 189.55402000000004, "r_x1": 316.8924, "r_y1": 189.55402000000004, "r_x2": 316.8924, "r_y2": 183.72198000000003, "r_x3": 313.07639, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89059, "r_y0": 189.55402000000004, "r_x1": 320.70657, "r_y1": 189.55402000000004, "r_x2": 320.70657, "r_y2": 183.72198000000003, "r_x3": 316.89059, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76321, "r_y0": 158.30602999999996, "r_x1": 316.57922, "r_y1": 158.30602999999996, "r_x2": 316.57922, "r_y2": 152.47400000000005, "r_x3": 312.76321, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.57742, "r_y0": 158.30602999999996, "r_x1": 320.3934, "r_y1": 158.30602999999996, "r_x2": 320.3934, "r_y2": 152.47400000000005, "r_x3": 316.57742, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.19775, "r_y0": 126.40252999999996, "r_x1": 316.01376, "r_y1": 126.40252999999996, "r_x2": 316.01376, "r_y2": 120.57050000000004, "r_x3": 312.19775, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01196, "r_y0": 126.40252999999996, "r_x1": 319.82794, "r_y1": 126.40252999999996, "r_x2": 319.82794, "r_y2": 120.57050000000004, "r_x3": 316.01196, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8165, "r_y0": 95.94073000000003, "r_x1": 316.63251, "r_y1": 95.94073000000003, "r_x2": 316.63251, "r_y2": 90.1087, "r_x3": 312.8165, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63071, "r_y0": 95.94073000000003, "r_x1": 320.44669, "r_y1": 95.94073000000003, "r_x2": 320.44669, "r_y2": 90.1087, "r_x3": 316.63071, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17426, "r_y0": 230.01727000000005, "r_x1": 536.94427, "r_y1": 230.01727000000005, "r_x2": 536.94427, "r_y2": 222.72729000000004, "r_x3": 532.17426, "r_y3": 222.72729000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.87952, "r_y0": 115.55700999999999, "r_x1": 547.61249, "r_y1": 115.55700999999999, "r_x2": 547.61249, "r_y2": 108.26702999999986, "r_x3": 532.87952, "r_y3": 108.26702999999986, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.7735, "r_y0": 138.07097999999996, "r_x1": 542.73877, "r_y1": 138.07097999999996, "r_x2": 542.73877, "r_y2": 130.78101000000004, "r_x3": 532.7735, "r_y3": 130.78101000000004, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.79901, "r_y0": 161.21349999999995, "r_x1": 542.76428, "r_y1": 161.21349999999995, "r_x2": 542.76428, "r_y2": 153.92352000000005, "r_x3": 532.79901, "r_y3": 153.92352000000005, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.5705, "r_y0": 184.04796999999996, "r_x1": 542.53577, "r_y1": 184.04796999999996, "r_x2": 542.53577, "r_y2": 176.75800000000004, "r_x3": 532.5705, "r_y3": 176.75800000000004, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.14551, "r_y0": 206.93628, "r_x1": 542.11078, "r_y1": 206.93628, "r_x2": 542.11078, "r_y2": 199.6463, "r_x3": 532.14551, "r_y3": 199.6463, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 276.74292, "r_x1": 346.06238, "r_y1": 276.74292, "r_x2": 346.06238, "r_y2": 267.83636, "r_x3": 308.862, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49072, "r_y0": 276.74292, "r_x1": 545.11511, "r_y1": 276.74292, "r_x2": 545.11511, "r_y2": 267.83636, "r_x3": 354.49072, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 288.6979099999999, "r_x1": 498.56989, "r_y1": 288.6979099999999, "r_x2": 498.56989, "r_y2": 279.79132000000004, "r_x3": 308.862, "r_y3": 279.79132000000004, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 326.37991, "r_x1": 437.27002, "r_y1": 326.37991, "r_x2": 437.27002, "r_y2": 317.47336, "r_x3": 308.862, "r_y3": 317.47336, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 340.43793, "r_x1": 545.11505, "r_y1": 340.43793, "r_x2": 545.11505, "r_y2": 331.53137, "r_x3": 320.81699, "r_y3": 331.53137, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 352.39291, "r_x1": 545.11517, "r_y1": 352.39291, "r_x2": 545.11517, "r_y2": 343.48635999999993, "r_x3": 308.862, "r_y3": 343.48635999999993, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 364.34890999999993, "r_x1": 545.11505, "r_y1": 364.34890999999993, "r_x2": 545.11505, "r_y2": 355.44235, "r_x3": 308.862, "r_y3": 355.44235, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 376.30389, "r_x1": 545.11505, "r_y1": 376.30389, "r_x2": 545.11505, "r_y2": 367.39734, "r_x3": 308.862, "r_y3": 367.39734, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 388.25888, "r_x1": 545.11511, "r_y1": 388.25888, "r_x2": 545.11511, "r_y2": 379.35233, "r_x3": 308.862, "r_y3": 379.35233, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.21386999999993, "r_x1": 545.11511, "r_y1": 400.21386999999993, "r_x2": 545.11511, "r_y2": 391.30731, "r_x3": 308.862, "r_y3": 391.30731, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.16885, "r_x1": 545.11505, "r_y1": 412.16885, "r_x2": 545.11505, "r_y2": 403.26230000000004, "r_x3": 308.862, "r_y3": 403.26230000000004, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.12384, "r_x1": 545.11511, "r_y1": 424.12384, "r_x2": 545.11511, "r_y2": 415.21729, "r_x3": 308.862, "r_y3": 415.21729, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.0798300000001, "r_x1": 545.11517, "r_y1": 436.0798300000001, "r_x2": 545.11517, "r_y2": 427.17328, "r_x3": 308.862, "r_y3": 427.17328, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.03482, "r_x1": 545.11517, "r_y1": 448.03482, "r_x2": 545.11517, "r_y2": 439.12827, "r_x3": 308.862, "r_y3": 439.12827, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 459.98981000000003, "r_x1": 545.11511, "r_y1": 459.98981000000003, "r_x2": 545.11511, "r_y2": 451.08325, "r_x3": 308.862, "r_y3": 451.08325, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 471.94479, "r_x1": 545.11505, "r_y1": 471.94479, "r_x2": 545.11505, "r_y2": 463.03824, "r_x3": 308.862, "r_y3": 463.03824, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 483.89978, "r_x1": 545.11511, "r_y1": 483.89978, "r_x2": 545.11511, "r_y2": 474.99323, "r_x3": 308.862, "r_y3": 474.99323, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 495.85577, "r_x1": 545.11511, "r_y1": 495.85577, "r_x2": 545.11511, "r_y2": 486.94922, "r_x3": 308.862, "r_y3": 486.94922, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 507.81076, "r_x1": 545.11511, "r_y1": 507.81076, "r_x2": 545.11511, "r_y2": 498.90421, "r_x3": 308.862, "r_y3": 498.90421, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 519.76575, "r_x1": 545.11517, "r_y1": 519.76575, "r_x2": 545.11517, "r_y2": 510.85919, "r_x3": 308.862, "r_y3": 510.85919, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 531.72073, "r_x1": 545.11517, "r_y1": 531.72073, "r_x2": 545.11517, "r_y2": 522.8141800000001, "r_x3": 308.862, "r_y3": 522.8141800000001, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 543.67574, "r_x1": 545.11505, "r_y1": 543.67574, "r_x2": 545.11505, "r_y2": 534.76917, "r_x3": 308.862, "r_y3": 534.76917, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 555.6307400000001, "r_x1": 545.11511, "r_y1": 555.6307400000001, "r_x2": 545.11511, "r_y2": 546.72418, "r_x3": 308.862, "r_y3": 546.72418, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 567.58673, "r_x1": 545.11511, "r_y1": 567.58673, "r_x2": 545.11511, "r_y2": 558.6801800000001, "r_x3": 308.862, "r_y3": 558.6801800000001, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 579.54173, "r_x1": 545.11505, "r_y1": 579.54173, "r_x2": 545.11505, "r_y2": 570.63518, "r_x3": 308.862, "r_y3": 570.63518, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 591.49673, "r_x1": 545.11499, "r_y1": 591.49673, "r_x2": 545.11499, "r_y2": 582.59018, "r_x3": 308.862, "r_y3": 582.59018, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 603.45174, "r_x1": 545.11517, "r_y1": 603.45174, "r_x2": 545.11517, "r_y2": 594.54518, "r_x3": 308.862, "r_y3": 594.54518, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 615.40674, "r_x1": 545.11511, "r_y1": 615.40674, "r_x2": 545.11511, "r_y2": 606.50018, "r_x3": 308.862, "r_y3": 606.50018, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 627.36174, "r_x1": 348.16446, "r_y1": 627.36174, "r_x2": 348.16446, "r_y2": 618.45518, "r_x3": 308.862, "r_y3": 618.45518, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 641.42075, "r_x1": 545.11487, "r_y1": 641.42075, "r_x2": 545.11487, "r_y2": 632.51419, "r_x3": 320.81699, "r_y3": 632.51419, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.37575, "r_x1": 545.11511, "r_y1": 653.37575, "r_x2": 545.11511, "r_y2": 644.46919, "r_x3": 308.862, "r_y3": 644.46919, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.33076, "r_x1": 545.11511, "r_y1": 665.33076, "r_x2": 545.11511, "r_y2": 656.42419, "r_x3": 308.862, "r_y3": 656.42419, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28676, "r_x1": 545.11499, "r_y1": 677.28676, "r_x2": 545.11499, "r_y2": 668.38019, "r_x3": 308.862, "r_y3": 668.38019, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24176, "r_x1": 545.11505, "r_y1": 689.24176, "r_x2": 545.11505, "r_y2": 680.33519, "r_x3": 308.862, "r_y3": 680.33519, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196762, "r_x1": 545.11505, "r_y1": 701.196762, "r_x2": 545.11505, "r_y2": 692.290192, "r_x3": 308.862, "r_y3": 692.290192, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151764, "r_x1": 545.11511, "r_y1": 713.151764, "r_x2": 545.11511, "r_y2": 704.245193, "r_x3": 308.862, "r_y3": 704.245193, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039761, "r_x1": 300.10229, "r_y1": 743.039761, "r_x2": 300.10229, "r_y2": 734.133198, "r_x3": 295.121, "r_y3": 734.133198, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 250.15102, "b": 84.11492999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.8767216801643372, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 250.15102, "r_y1": 84.11492999999996, "r_x2": 250.15102, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "text", "bbox": { "l": 50.112, "t": 87.21935999999994, "r": 286.36514, "b": 275.45410000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9822593927383423, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.12591999999995, "r_x1": 70.365845, "r_y1": 96.12591999999995, "r_x2": 70.365845, "r_y2": 87.21935999999994, "r_x3": 62.067001, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.931198, "r_y0": 96.12591999999995, "r_x1": 110.95348000000001, "r_y1": 96.12591999999995, "r_x2": 110.95348000000001, "r_y2": 87.21935999999994, "r_x3": 76.931198, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54498, "r_y0": 96.12591999999995, "r_x1": 136.25848, "r_y1": 96.12591999999995, "r_x2": 136.25848, "r_y2": 87.21935999999994, "r_x3": 118.54498, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82384, "r_y0": 96.12591999999995, "r_x1": 175.37166, "r_y1": 96.12591999999995, "r_x2": 175.37166, "r_y2": 87.21935999999994, "r_x3": 142.82384, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.94698, "r_y0": 96.12591999999995, "r_x1": 232.83594000000002, "r_y1": 96.12591999999995, "r_x2": 232.83594000000002, "r_y2": 87.21935999999994, "r_x3": 181.94698, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41125, "r_y0": 96.12591999999995, "r_x1": 265.41364, "r_y1": 96.12591999999995, "r_x2": 265.41364, "r_y2": 87.21935999999994, "r_x3": 239.41125, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.979, "r_y0": 96.12591999999995, "r_x1": 286.36499, "r_y1": 96.12591999999995, "r_x2": 286.36499, "r_y2": 87.21935999999994, "r_x3": 271.979, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.08092999999997, "r_x1": 286.36505, "r_y1": 108.08092999999997, "r_x2": 286.36505, "r_y2": 99.17437999999993, "r_x3": 50.112, "r_y3": 99.17437999999993, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.03692999999998, "r_x1": 286.36511, "r_y1": 120.03692999999998, "r_x2": 286.36511, "r_y2": 111.13036999999997, "r_x3": 50.112, "r_y3": 111.13036999999997, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.99194, "r_x1": 286.36505, "r_y1": 131.99194, "r_x2": 286.36505, "r_y2": 123.08538999999996, "r_x3": 50.112, "r_y3": 123.08538999999996, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.94696, "r_x1": 286.36514, "r_y1": 143.94696, "r_x2": 286.36514, "r_y2": 135.04040999999995, "r_x3": 50.112, "r_y3": 135.04040999999995, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.90197999999998, "r_x1": 286.36511, "r_y1": 155.90197999999998, "r_x2": 286.36511, "r_y2": 146.99541999999997, "r_x3": 50.112, "r_y3": 146.99541999999997, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 167.85699, "r_x1": 286.36505, "r_y1": 167.85699, "r_x2": 286.36505, "r_y2": 158.95043999999996, "r_x3": 50.112, "r_y3": 158.95043999999996, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 179.81201, "r_x1": 286.36508, "r_y1": 179.81201, "r_x2": 286.36508, "r_y2": 170.90545999999995, "r_x3": 50.112, "r_y3": 170.90545999999995, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 191.76801, "r_x1": 286.36508, "r_y1": 191.76801, "r_x2": 286.36508, "r_y2": 182.86145, "r_x3": 50.112, "r_y3": 182.86145, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 203.72302000000002, "r_x1": 286.36511, "r_y1": 203.72302000000002, "r_x2": 286.36511, "r_y2": 194.81646999999998, "r_x3": 50.112, "r_y3": 194.81646999999998, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 215.67804, "r_x1": 286.36511, "r_y1": 215.67804, "r_x2": 286.36511, "r_y2": 206.77148, "r_x3": 50.112, "r_y3": 206.77148, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 227.63306, "r_x1": 286.36505, "r_y1": 227.63306, "r_x2": 286.36505, "r_y2": 218.7265, "r_x3": 50.112, "r_y3": 218.7265, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 239.58807000000002, "r_x1": 286.36505, "r_y1": 239.58807000000002, "r_x2": 286.36505, "r_y2": 230.68151999999998, "r_x3": 50.112, "r_y3": 230.68151999999998, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 251.54309, "r_x1": 286.36511, "r_y1": 251.54309, "r_x2": 286.36511, "r_y2": 242.63653999999997, "r_x3": 50.112, "r_y3": 242.63653999999997, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 263.49908000000005, "r_x1": 286.36508, "r_y1": 263.49908000000005, "r_x2": 286.36508, "r_y2": 254.59253, "r_x3": 50.112, "r_y3": 254.59253, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 275.45410000000004, "r_x1": 64.776947, "r_y1": 275.45410000000004, "r_x2": 64.776947, "r_y2": 266.54755, "r_x3": 50.112, "r_y3": 266.54755, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 50.111992, "t": 278.43895999999995, "r": 286.36511, "b": 490.70288, "coord_origin": "TOPLEFT" }, "confidence": 0.9878450036048889, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 287.39536, "r_x1": 171.56593, "r_y1": 287.39536, "r_x2": 171.56593, "r_y2": 278.43895999999995, "r_x3": 62.067001, "r_y3": 278.43895999999995, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.56799, "r_y0": 287.46509, "r_x1": 174.3376, "r_y1": 287.46509, "r_x2": 174.3376, "r_y2": 278.55853, "r_x3": 171.56799, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.18687, "r_y0": 287.46509, "r_x1": 286.35709, "r_y1": 287.46509, "r_x2": 286.35709, "r_y2": 278.55853, "r_x3": 185.18687, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 299.42108, "r_x1": 286.36511, "r_y1": 299.42108, "r_x2": 286.36511, "r_y2": 290.51453000000004, "r_x3": 50.111992, "r_y3": 290.51453000000004, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 311.37607, "r_x1": 131.16771, "r_y1": 311.37607, "r_x2": 131.16771, "r_y2": 302.46950999999996, "r_x3": 50.111992, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.84888, "r_y0": 311.37607, "r_x1": 286.36508, "r_y1": 311.37607, "r_x2": 286.36508, "r_y2": 302.46950999999996, "r_x3": 138.84888, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 323.33105, "r_x1": 286.36505, "r_y1": 323.33105, "r_x2": 286.36505, "r_y2": 314.4245, "r_x3": 50.111992, "r_y3": 314.4245, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 335.28604, "r_x1": 286.36508, "r_y1": 335.28604, "r_x2": 286.36508, "r_y2": 326.37949000000003, "r_x3": 50.111992, "r_y3": 326.37949000000003, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 347.2410300000001, "r_x1": 286.36505, "r_y1": 347.2410300000001, "r_x2": 286.36505, "r_y2": 338.33447, "r_x3": 50.111992, "r_y3": 338.33447, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 359.19601, "r_x1": 286.36505, "r_y1": 359.19601, "r_x2": 286.36505, "r_y2": 350.28946, "r_x3": 50.111992, "r_y3": 350.28946, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 371.15201, "r_x1": 286.36508, "r_y1": 371.15201, "r_x2": 286.36508, "r_y2": 362.24545000000006, "r_x3": 50.111992, "r_y3": 362.24545000000006, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 383.10699, "r_x1": 286.36508, "r_y1": 383.10699, "r_x2": 286.36508, "r_y2": 374.20044, "r_x3": 50.111992, "r_y3": 374.20044, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 395.06198, "r_x1": 286.36508, "r_y1": 395.06198, "r_x2": 286.36508, "r_y2": 386.15542999999997, "r_x3": 50.111992, "r_y3": 386.15542999999997, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 407.01697, "r_x1": 286.36508, "r_y1": 407.01697, "r_x2": 286.36508, "r_y2": 398.11041000000006, "r_x3": 50.111992, "r_y3": 398.11041000000006, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 418.97195, "r_x1": 286.36508, "r_y1": 418.97195, "r_x2": 286.36508, "r_y2": 410.0654, "r_x3": 50.111992, "r_y3": 410.0654, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 430.92694, "r_x1": 286.36505, "r_y1": 430.92694, "r_x2": 286.36505, "r_y2": 422.02038999999996, "r_x3": 50.111992, "r_y3": 422.02038999999996, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 442.88293, "r_x1": 198.2359, "r_y1": 442.88293, "r_x2": 198.2359, "r_y2": 433.97638, "r_x3": 50.111992, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.92703, "r_y0": 442.88293, "r_x1": 286.36505, "r_y1": 442.88293, "r_x2": 286.36505, "r_y2": 433.97638, "r_x3": 205.92703, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 454.83792000000005, "r_x1": 286.36508, "r_y1": 454.83792000000005, "r_x2": 286.36508, "r_y2": 445.93137, "r_x3": 50.111992, "r_y3": 445.93137, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 466.79291, "r_x1": 286.36505, "r_y1": 466.79291, "r_x2": 286.36505, "r_y2": 457.88635, "r_x3": 50.111992, "r_y3": 457.88635, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 478.74789, "r_x1": 286.36505, "r_y1": 478.74789, "r_x2": 286.36505, "r_y2": 469.84134, "r_x3": 50.111992, "r_y3": 469.84134, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 490.70288, "r_x1": 186.49998, "r_y1": 490.70288, "r_x2": 186.49998, "r_y2": 481.79633, "r_x3": 50.111992, "r_y3": 481.79633, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.111984, "t": 493.68875, "r": 286.36627, "b": 622.26685, "coord_origin": "TOPLEFT" }, "confidence": 0.9875094294548035, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066994, "r_y0": 502.64514, "r_x1": 252.88068000000004, "r_y1": 502.64514, "r_x2": 252.88068000000004, "r_y2": 493.68875, "r_x3": 62.066994, "r_y3": 493.68875, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88199, "r_y0": 502.71487, "r_x1": 286.36627, "r_y1": 502.71487, "r_x2": 286.36627, "r_y2": 493.80832, "r_x3": 252.88199, "r_y3": 493.80832, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 514.66986, "r_x1": 286.36505, "r_y1": 514.66986, "r_x2": 286.36505, "r_y2": 505.76331, "r_x3": 50.111984, "r_y3": 505.76331, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 526.6248499999999, "r_x1": 286.36505, "r_y1": 526.6248499999999, "r_x2": 286.36505, "r_y2": 517.71829, "r_x3": 50.111984, "r_y3": 517.71829, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 538.57985, "r_x1": 286.36508, "r_y1": 538.57985, "r_x2": 286.36508, "r_y2": 529.67328, "r_x3": 50.111984, "r_y3": 529.67328, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 550.53584, "r_x1": 286.36508, "r_y1": 550.53584, "r_x2": 286.36508, "r_y2": 541.62929, "r_x3": 50.111984, "r_y3": 541.62929, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 562.4908399999999, "r_x1": 286.36511, "r_y1": 562.4908399999999, "r_x2": 286.36511, "r_y2": 553.58429, "r_x3": 50.111984, "r_y3": 553.58429, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 574.44585, "r_x1": 286.36511, "r_y1": 574.44585, "r_x2": 286.36511, "r_y2": 565.5392899999999, "r_x3": 50.111984, "r_y3": 565.5392899999999, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 586.40085, "r_x1": 286.36502, "r_y1": 586.40085, "r_x2": 286.36502, "r_y2": 577.49429, "r_x3": 50.111984, "r_y3": 577.49429, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 598.35585, "r_x1": 286.36505, "r_y1": 598.35585, "r_x2": 286.36505, "r_y2": 589.4493, "r_x3": 50.111984, "r_y3": 589.4493, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 610.31085, "r_x1": 286.36502, "r_y1": 610.31085, "r_x2": 286.36502, "r_y2": 601.4043, "r_x3": 50.111984, "r_y3": 601.4043, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 622.26685, "r_x1": 175.98943, "r_y1": 622.26685, "r_x2": 175.98943, "r_y2": 613.36029, "r_x3": 50.111984, "r_y3": 613.36029, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "section_header", "bbox": { "l": 50.111984, "t": 635.94484, "r": 105.22546, "b": 646.6925699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9423062205314636, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 646.6925699999999, "r_x1": 57.82375699999999, "r_y1": 646.6925699999999, "r_x2": 57.82375699999999, "r_y2": 635.94484, "r_x3": 50.111984, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.106125, "r_y0": 646.6925699999999, "r_x1": 105.22546, "r_y1": 646.6925699999999, "r_x2": 105.22546, "r_y2": 635.94484, "r_x3": 68.106125, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.111984, "t": 656.42529, "r": 286.36508, "b": 713.151863, "coord_origin": "TOPLEFT" }, "confidence": 0.9862047433853149, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 665.33186, "r_x1": 286.36493, "r_y1": 665.33186, "r_x2": 286.36493, "r_y2": 656.42529, "r_x3": 62.06698600000001, "r_y3": 656.42529, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 677.2868599999999, "r_x1": 286.36508, "r_y1": 677.2868599999999, "r_x2": 286.36508, "r_y2": 668.38029, "r_x3": 50.111984, "r_y3": 668.38029, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 689.24186, "r_x1": 286.36502, "r_y1": 689.24186, "r_x2": 286.36502, "r_y2": 680.3353, "r_x3": 50.111984, "r_y3": 680.3353, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 701.196861, "r_x1": 166.24602, "r_y1": 701.196861, "r_x2": 166.24602, "r_y2": 692.290298, "r_x3": 50.111984, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.68808, "r_y0": 701.196861, "r_x1": 286.36508, "r_y1": 701.196861, "r_x2": 286.36508, "r_y2": 692.290298, "r_x3": 173.68808, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 713.151863, "r_x1": 286.36505, "r_y1": 713.151863, "r_x2": 286.36505, "r_y2": 704.2453, "r_x3": 50.111984, "r_y3": 704.2453, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "picture", "bbox": { "l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT" }, "confidence": 0.9746918082237244, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.79849, "r_y0": 88.55975000000001, "r_x1": 486.84909, "r_y1": 88.55975000000001, "r_x2": 486.84909, "r_y2": 79.81176999999991, "r_x3": 380.79849, "r_y3": 79.81176999999991, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.76776, "r_y0": 250.77495999999996, "r_x1": 469.78748, "r_y1": 250.77495999999996, "r_x2": 469.78748, "r_y2": 242.02697999999998, "r_x3": 396.76776, "r_y3": 242.02697999999998, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.97653, "r_y0": 239.255, "r_x1": 324.79254, "r_y1": 239.255, "r_x2": 324.79254, "r_y2": 233.42296999999996, "r_x3": 320.97653, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.483, "r_y0": 239.255, "r_x1": 418.11319, "r_y1": 239.255, "r_x2": 418.11319, "r_y2": 233.42296999999996, "r_x3": 410.483, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.84949, "r_y0": 239.255, "r_x1": 508.47968000000003, "r_y1": 239.255, "r_x2": 508.47968000000003, "r_y2": 233.42296999999996, "r_x3": 500.84949, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.29999, "r_y0": 239.255, "r_x1": 372.93018, "r_y1": 239.255, "r_x2": 372.93018, "r_y2": 233.42296999999996, "r_x3": 365.29999, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.66626, "r_y0": 239.255, "r_x1": 463.29645, "r_y1": 239.255, "r_x2": 463.29645, "r_y2": 233.42296999999996, "r_x3": 455.66626, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.03528, "r_y0": 239.255, "r_x1": 549.66547, "r_y1": 239.255, "r_x2": 549.66547, "r_y2": 233.42296999999996, "r_x3": 542.03528, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04474, "r_y0": 236.27819999999997, "r_x1": 319.86075, "r_y1": 236.27819999999997, "r_x2": 319.86075, "r_y2": 230.44617000000005, "r_x3": 316.04474, "r_y3": 230.44617000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.62521, "r_y0": 204.52277000000004, "r_x1": 316.44122, "r_y1": 204.52277000000004, "r_x2": 316.44122, "r_y2": 198.69073000000003, "r_x3": 312.62521, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.43942, "r_y0": 204.52277000000004, "r_x1": 320.2554, "r_y1": 204.52277000000004, "r_x2": 320.2554, "r_y2": 198.69073000000003, "r_x3": 316.43942, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.14951, "r_y0": 173.92998999999998, "r_x1": 316.96552, "r_y1": 173.92998999999998, "r_x2": 316.96552, "r_y2": 168.09795999999994, "r_x3": 313.14951, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96371, "r_y0": 173.92998999999998, "r_x1": 320.77969, "r_y1": 173.92998999999998, "r_x2": 320.77969, "r_y2": 168.09795999999994, "r_x3": 316.96371, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.92972, "r_y0": 142.41974000000005, "r_x1": 316.74573, "r_y1": 142.41974000000005, "r_x2": 316.74573, "r_y2": 136.58771000000002, "r_x3": 312.92972, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74393, "r_y0": 142.41974000000005, "r_x1": 320.55991, "r_y1": 142.41974000000005, "r_x2": 320.55991, "r_y2": 136.58771000000002, "r_x3": 316.74393, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 111.43377999999996, "r_x1": 316.29828, "r_y1": 111.43377999999996, "r_x2": 316.29828, "r_y2": 105.60175000000004, "r_x3": 312.48227, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 111.43377999999996, "r_x1": 320.11246, "r_y1": 111.43377999999996, "r_x2": 320.11246, "r_y2": 105.60175000000004, "r_x3": 316.29648, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 218.09124999999995, "r_x1": 316.29828, "r_y1": 218.09124999999995, "r_x2": 316.29828, "r_y2": 212.25922000000003, "r_x3": 312.48227, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 218.09124999999995, "r_x1": 320.11246, "r_y1": 218.09124999999995, "r_x2": 320.11246, "r_y2": 212.25922000000003, "r_x3": 316.29648, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.07639, "r_y0": 189.55402000000004, "r_x1": 316.8924, "r_y1": 189.55402000000004, "r_x2": 316.8924, "r_y2": 183.72198000000003, "r_x3": 313.07639, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89059, "r_y0": 189.55402000000004, "r_x1": 320.70657, "r_y1": 189.55402000000004, "r_x2": 320.70657, "r_y2": 183.72198000000003, "r_x3": 316.89059, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76321, "r_y0": 158.30602999999996, "r_x1": 316.57922, "r_y1": 158.30602999999996, "r_x2": 316.57922, "r_y2": 152.47400000000005, "r_x3": 312.76321, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.57742, "r_y0": 158.30602999999996, "r_x1": 320.3934, "r_y1": 158.30602999999996, "r_x2": 320.3934, "r_y2": 152.47400000000005, "r_x3": 316.57742, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.19775, "r_y0": 126.40252999999996, "r_x1": 316.01376, "r_y1": 126.40252999999996, "r_x2": 316.01376, "r_y2": 120.57050000000004, "r_x3": 312.19775, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01196, "r_y0": 126.40252999999996, "r_x1": 319.82794, "r_y1": 126.40252999999996, "r_x2": 319.82794, "r_y2": 120.57050000000004, "r_x3": 316.01196, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8165, "r_y0": 95.94073000000003, "r_x1": 316.63251, "r_y1": 95.94073000000003, "r_x2": 316.63251, "r_y2": 90.1087, "r_x3": 312.8165, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63071, "r_y0": 95.94073000000003, "r_x1": 320.44669, "r_y1": 95.94073000000003, "r_x2": 320.44669, "r_y2": 90.1087, "r_x3": 316.63071, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17426, "r_y0": 230.01727000000005, "r_x1": 536.94427, "r_y1": 230.01727000000005, "r_x2": 536.94427, "r_y2": 222.72729000000004, "r_x3": 532.17426, "r_y3": 222.72729000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.87952, "r_y0": 115.55700999999999, "r_x1": 547.61249, "r_y1": 115.55700999999999, "r_x2": 547.61249, "r_y2": 108.26702999999986, "r_x3": 532.87952, "r_y3": 108.26702999999986, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.7735, "r_y0": 138.07097999999996, "r_x1": 542.73877, "r_y1": 138.07097999999996, "r_x2": 542.73877, "r_y2": 130.78101000000004, "r_x3": 532.7735, "r_y3": 130.78101000000004, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.79901, "r_y0": 161.21349999999995, "r_x1": 542.76428, "r_y1": 161.21349999999995, "r_x2": 542.76428, "r_y2": 153.92352000000005, "r_x3": 532.79901, "r_y3": 153.92352000000005, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.5705, "r_y0": 184.04796999999996, "r_x1": 542.53577, "r_y1": 184.04796999999996, "r_x2": 542.53577, "r_y2": 176.75800000000004, "r_x3": 532.5705, "r_y3": 176.75800000000004, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.14551, "r_y0": 206.93628, "r_x1": 542.11078, "r_y1": 206.93628, "r_x2": 542.11078, "r_y2": 199.6463, "r_x3": 532.14551, "r_y3": 199.6463, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 12, "label": "section_header", "bbox": { "l": 380.79849, "t": 79.81176999999991, "r": 486.84909, "b": 88.55975000000001, "coord_origin": "TOPLEFT" }, "confidence": 0.5687217116355896, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.79849, "r_y0": 88.55975000000001, "r_x1": 486.84909, "r_y1": 88.55975000000001, "r_x2": 486.84909, "r_y2": 79.81176999999991, "r_x3": 380.79849, "r_y3": 79.81176999999991, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 396.76776, "t": 242.02697999999998, "r": 469.78748, "b": 250.77495999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.76776, "r_y0": 250.77495999999996, "r_x1": 469.78748, "r_y1": 250.77495999999996, "r_x2": 469.78748, "r_y2": 242.02697999999998, "r_x3": 396.76776, "r_y3": 242.02697999999998, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 320.97653, "t": 233.42296999999996, "r": 324.79254, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.97653, "r_y0": 239.255, "r_x1": 324.79254, "r_y1": 239.255, "r_x2": 324.79254, "r_y2": 233.42296999999996, "r_x3": 320.97653, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 410.483, "t": 233.42296999999996, "r": 418.11319, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.483, "r_y0": 239.255, "r_x1": 418.11319, "r_y1": 239.255, "r_x2": 418.11319, "r_y2": 233.42296999999996, "r_x3": 410.483, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 500.84949, "t": 233.42296999999996, "r": 508.47968000000003, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.84949, "r_y0": 239.255, "r_x1": 508.47968000000003, "r_y1": 239.255, "r_x2": 508.47968000000003, "r_y2": 233.42296999999996, "r_x3": 500.84949, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 365.29999, "t": 233.42296999999996, "r": 372.93018, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.29999, "r_y0": 239.255, "r_x1": 372.93018, "r_y1": 239.255, "r_x2": 372.93018, "r_y2": 233.42296999999996, "r_x3": 365.29999, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 455.66626, "t": 233.42296999999996, "r": 463.29645, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.66626, "r_y0": 239.255, "r_x1": 463.29645, "r_y1": 239.255, "r_x2": 463.29645, "r_y2": 233.42296999999996, "r_x3": 455.66626, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 542.03528, "t": 233.42296999999996, "r": 549.66547, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.03528, "r_y0": 239.255, "r_x1": 549.66547, "r_y1": 239.255, "r_x2": 549.66547, "r_y2": 233.42296999999996, "r_x3": 542.03528, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 316.04474, "t": 230.44617000000005, "r": 319.86075, "b": 236.27819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04474, "r_y0": 236.27819999999997, "r_x1": 319.86075, "r_y1": 236.27819999999997, "r_x2": 319.86075, "r_y2": 230.44617000000005, "r_x3": 316.04474, "r_y3": 230.44617000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 312.62521, "t": 198.69073000000003, "r": 316.44122, "b": 204.52277000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.62521, "r_y0": 204.52277000000004, "r_x1": 316.44122, "r_y1": 204.52277000000004, "r_x2": 316.44122, "r_y2": 198.69073000000003, "r_x3": 312.62521, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 316.43942, "t": 198.69073000000003, "r": 320.2554, "b": 204.52277000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.43942, "r_y0": 204.52277000000004, "r_x1": 320.2554, "r_y1": 204.52277000000004, "r_x2": 320.2554, "r_y2": 198.69073000000003, "r_x3": 316.43942, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 313.14951, "t": 168.09795999999994, "r": 316.96552, "b": 173.92998999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.14951, "r_y0": 173.92998999999998, "r_x1": 316.96552, "r_y1": 173.92998999999998, "r_x2": 316.96552, "r_y2": 168.09795999999994, "r_x3": 313.14951, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 316.96371, "t": 168.09795999999994, "r": 320.77969, "b": 173.92998999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96371, "r_y0": 173.92998999999998, "r_x1": 320.77969, "r_y1": 173.92998999999998, "r_x2": 320.77969, "r_y2": 168.09795999999994, "r_x3": 316.96371, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 312.92972, "t": 136.58771000000002, "r": 316.74573, "b": 142.41974000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.92972, "r_y0": 142.41974000000005, "r_x1": 316.74573, "r_y1": 142.41974000000005, "r_x2": 316.74573, "r_y2": 136.58771000000002, "r_x3": 312.92972, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 316.74393, "t": 136.58771000000002, "r": 320.55991, "b": 142.41974000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74393, "r_y0": 142.41974000000005, "r_x1": 320.55991, "r_y1": 142.41974000000005, "r_x2": 320.55991, "r_y2": 136.58771000000002, "r_x3": 316.74393, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 312.48227, "t": 105.60175000000004, "r": 316.29828, "b": 111.43377999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 111.43377999999996, "r_x1": 316.29828, "r_y1": 111.43377999999996, "r_x2": 316.29828, "r_y2": 105.60175000000004, "r_x3": 312.48227, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 316.29648, "t": 105.60175000000004, "r": 320.11246, "b": 111.43377999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 111.43377999999996, "r_x1": 320.11246, "r_y1": 111.43377999999996, "r_x2": 320.11246, "r_y2": 105.60175000000004, "r_x3": 316.29648, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 312.48227, "t": 212.25922000000003, "r": 316.29828, "b": 218.09124999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 218.09124999999995, "r_x1": 316.29828, "r_y1": 218.09124999999995, "r_x2": 316.29828, "r_y2": 212.25922000000003, "r_x3": 312.48227, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 316.29648, "t": 212.25922000000003, "r": 320.11246, "b": 218.09124999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 218.09124999999995, "r_x1": 320.11246, "r_y1": 218.09124999999995, "r_x2": 320.11246, "r_y2": 212.25922000000003, "r_x3": 316.29648, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 313.07639, "t": 183.72198000000003, "r": 316.8924, "b": 189.55402000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.07639, "r_y0": 189.55402000000004, "r_x1": 316.8924, "r_y1": 189.55402000000004, "r_x2": 316.8924, "r_y2": 183.72198000000003, "r_x3": 313.07639, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 316.89059, "t": 183.72198000000003, "r": 320.70657, "b": 189.55402000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89059, "r_y0": 189.55402000000004, "r_x1": 320.70657, "r_y1": 189.55402000000004, "r_x2": 320.70657, "r_y2": 183.72198000000003, "r_x3": 316.89059, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 312.76321, "t": 152.47400000000005, "r": 316.57922, "b": 158.30602999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76321, "r_y0": 158.30602999999996, "r_x1": 316.57922, "r_y1": 158.30602999999996, "r_x2": 316.57922, "r_y2": 152.47400000000005, "r_x3": 312.76321, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 316.57742, "t": 152.47400000000005, "r": 320.3934, "b": 158.30602999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.57742, "r_y0": 158.30602999999996, "r_x1": 320.3934, "r_y1": 158.30602999999996, "r_x2": 320.3934, "r_y2": 152.47400000000005, "r_x3": 316.57742, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 312.19775, "t": 120.57050000000004, "r": 316.01376, "b": 126.40252999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.19775, "r_y0": 126.40252999999996, "r_x1": 316.01376, "r_y1": 126.40252999999996, "r_x2": 316.01376, "r_y2": 120.57050000000004, "r_x3": 312.19775, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 316.01196, "t": 120.57050000000004, "r": 319.82794, "b": 126.40252999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01196, "r_y0": 126.40252999999996, "r_x1": 319.82794, "r_y1": 126.40252999999996, "r_x2": 319.82794, "r_y2": 120.57050000000004, "r_x3": 316.01196, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 312.8165, "t": 90.1087, "r": 316.63251, "b": 95.94073000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8165, "r_y0": 95.94073000000003, "r_x1": 316.63251, "r_y1": 95.94073000000003, "r_x2": 316.63251, "r_y2": 90.1087, "r_x3": 312.8165, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 316.63071, "t": 90.1087, "r": 320.44669, "b": 95.94073000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63071, "r_y0": 95.94073000000003, "r_x1": 320.44669, "r_y1": 95.94073000000003, "r_x2": 320.44669, "r_y2": 90.1087, "r_x3": 316.63071, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 532.17426, "t": 222.72729000000004, "r": 536.94427, "b": 230.01727000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17426, "r_y0": 230.01727000000005, "r_x1": 536.94427, "r_y1": 230.01727000000005, "r_x2": 536.94427, "r_y2": 222.72729000000004, "r_x3": 532.17426, "r_y3": 222.72729000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 532.87952, "t": 108.26702999999986, "r": 547.61249, "b": 115.55700999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.87952, "r_y0": 115.55700999999999, "r_x1": 547.61249, "r_y1": 115.55700999999999, "r_x2": 547.61249, "r_y2": 108.26702999999986, "r_x3": 532.87952, "r_y3": 108.26702999999986, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 532.7735, "t": 130.78101000000004, "r": 542.73877, "b": 138.07097999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.7735, "r_y0": 138.07097999999996, "r_x1": 542.73877, "r_y1": 138.07097999999996, "r_x2": 542.73877, "r_y2": 130.78101000000004, "r_x3": 532.7735, "r_y3": 130.78101000000004, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 532.79901, "t": 153.92352000000005, "r": 542.76428, "b": 161.21349999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.79901, "r_y0": 161.21349999999995, "r_x1": 542.76428, "r_y1": 161.21349999999995, "r_x2": 542.76428, "r_y2": 153.92352000000005, "r_x3": 532.79901, "r_y3": 153.92352000000005, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 532.5705, "t": 176.75800000000004, "r": 542.53577, "b": 184.04796999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.5705, "r_y0": 184.04796999999996, "r_x1": 542.53577, "r_y1": 184.04796999999996, "r_x2": 542.53577, "r_y2": 176.75800000000004, "r_x3": 532.5705, "r_y3": 176.75800000000004, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 532.14551, "t": 199.6463, "r": 542.11078, "b": 206.93628, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.14551, "r_y0": 206.93628, "r_x1": 542.11078, "r_y1": 206.93628, "r_x2": 542.11078, "r_y2": 199.6463, "r_x3": 532.14551, "r_y3": 199.6463, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 7, "label": "caption", "bbox": { "l": 308.862, "t": 267.83636, "r": 545.11511, "b": 288.6979099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9667505025863647, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 276.74292, "r_x1": 346.06238, "r_y1": 276.74292, "r_x2": 346.06238, "r_y2": 267.83636, "r_x3": 308.862, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49072, "r_y0": 276.74292, "r_x1": 545.11511, "r_y1": 276.74292, "r_x2": 545.11511, "r_y2": 267.83636, "r_x3": 354.49072, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 288.6979099999999, "r_x1": 498.56989, "r_y1": 288.6979099999999, "r_x2": 498.56989, "r_y2": 279.79132000000004, "r_x3": 308.862, "r_y3": 279.79132000000004, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 308.862, "t": 317.47336, "r": 437.27002, "b": 326.37991, "coord_origin": "TOPLEFT" }, "confidence": 0.8879811763763428, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 326.37991, "r_x1": 437.27002, "r_y1": 326.37991, "r_x2": 437.27002, "r_y2": 317.47336, "r_x3": 308.862, "r_y3": 317.47336, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.862, "t": 331.53137, "r": 545.11517, "b": 627.36174, "coord_origin": "TOPLEFT" }, "confidence": 0.9870319366455078, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 340.43793, "r_x1": 545.11505, "r_y1": 340.43793, "r_x2": 545.11505, "r_y2": 331.53137, "r_x3": 320.81699, "r_y3": 331.53137, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 352.39291, "r_x1": 545.11517, "r_y1": 352.39291, "r_x2": 545.11517, "r_y2": 343.48635999999993, "r_x3": 308.862, "r_y3": 343.48635999999993, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 364.34890999999993, "r_x1": 545.11505, "r_y1": 364.34890999999993, "r_x2": 545.11505, "r_y2": 355.44235, "r_x3": 308.862, "r_y3": 355.44235, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 376.30389, "r_x1": 545.11505, "r_y1": 376.30389, "r_x2": 545.11505, "r_y2": 367.39734, "r_x3": 308.862, "r_y3": 367.39734, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 388.25888, "r_x1": 545.11511, "r_y1": 388.25888, "r_x2": 545.11511, "r_y2": 379.35233, "r_x3": 308.862, "r_y3": 379.35233, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.21386999999993, "r_x1": 545.11511, "r_y1": 400.21386999999993, "r_x2": 545.11511, "r_y2": 391.30731, "r_x3": 308.862, "r_y3": 391.30731, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.16885, "r_x1": 545.11505, "r_y1": 412.16885, "r_x2": 545.11505, "r_y2": 403.26230000000004, "r_x3": 308.862, "r_y3": 403.26230000000004, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.12384, "r_x1": 545.11511, "r_y1": 424.12384, "r_x2": 545.11511, "r_y2": 415.21729, "r_x3": 308.862, "r_y3": 415.21729, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.0798300000001, "r_x1": 545.11517, "r_y1": 436.0798300000001, "r_x2": 545.11517, "r_y2": 427.17328, "r_x3": 308.862, "r_y3": 427.17328, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.03482, "r_x1": 545.11517, "r_y1": 448.03482, "r_x2": 545.11517, "r_y2": 439.12827, "r_x3": 308.862, "r_y3": 439.12827, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 459.98981000000003, "r_x1": 545.11511, "r_y1": 459.98981000000003, "r_x2": 545.11511, "r_y2": 451.08325, "r_x3": 308.862, "r_y3": 451.08325, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 471.94479, "r_x1": 545.11505, "r_y1": 471.94479, "r_x2": 545.11505, "r_y2": 463.03824, "r_x3": 308.862, "r_y3": 463.03824, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 483.89978, "r_x1": 545.11511, "r_y1": 483.89978, "r_x2": 545.11511, "r_y2": 474.99323, "r_x3": 308.862, "r_y3": 474.99323, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 495.85577, "r_x1": 545.11511, "r_y1": 495.85577, "r_x2": 545.11511, "r_y2": 486.94922, "r_x3": 308.862, "r_y3": 486.94922, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 507.81076, "r_x1": 545.11511, "r_y1": 507.81076, "r_x2": 545.11511, "r_y2": 498.90421, "r_x3": 308.862, "r_y3": 498.90421, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 519.76575, "r_x1": 545.11517, "r_y1": 519.76575, "r_x2": 545.11517, "r_y2": 510.85919, "r_x3": 308.862, "r_y3": 510.85919, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 531.72073, "r_x1": 545.11517, "r_y1": 531.72073, "r_x2": 545.11517, "r_y2": 522.8141800000001, "r_x3": 308.862, "r_y3": 522.8141800000001, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 543.67574, "r_x1": 545.11505, "r_y1": 543.67574, "r_x2": 545.11505, "r_y2": 534.76917, "r_x3": 308.862, "r_y3": 534.76917, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 555.6307400000001, "r_x1": 545.11511, "r_y1": 555.6307400000001, "r_x2": 545.11511, "r_y2": 546.72418, "r_x3": 308.862, "r_y3": 546.72418, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 567.58673, "r_x1": 545.11511, "r_y1": 567.58673, "r_x2": 545.11511, "r_y2": 558.6801800000001, "r_x3": 308.862, "r_y3": 558.6801800000001, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 579.54173, "r_x1": 545.11505, "r_y1": 579.54173, "r_x2": 545.11505, "r_y2": 570.63518, "r_x3": 308.862, "r_y3": 570.63518, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 591.49673, "r_x1": 545.11499, "r_y1": 591.49673, "r_x2": 545.11499, "r_y2": 582.59018, "r_x3": 308.862, "r_y3": 582.59018, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 603.45174, "r_x1": 545.11517, "r_y1": 603.45174, "r_x2": 545.11517, "r_y2": 594.54518, "r_x3": 308.862, "r_y3": 594.54518, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 615.40674, "r_x1": 545.11511, "r_y1": 615.40674, "r_x2": 545.11511, "r_y2": 606.50018, "r_x3": 308.862, "r_y3": 606.50018, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 627.36174, "r_x1": 348.16446, "r_y1": 627.36174, "r_x2": 348.16446, "r_y2": 618.45518, "r_x3": 308.862, "r_y3": 618.45518, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 308.862, "t": 632.51419, "r": 545.11511, "b": 713.151764, "coord_origin": "TOPLEFT" }, "confidence": 0.9840091466903687, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 641.42075, "r_x1": 545.11487, "r_y1": 641.42075, "r_x2": 545.11487, "r_y2": 632.51419, "r_x3": 320.81699, "r_y3": 632.51419, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.37575, "r_x1": 545.11511, "r_y1": 653.37575, "r_x2": 545.11511, "r_y2": 644.46919, "r_x3": 308.862, "r_y3": 644.46919, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.33076, "r_x1": 545.11511, "r_y1": 665.33076, "r_x2": 545.11511, "r_y2": 656.42419, "r_x3": 308.862, "r_y3": 656.42419, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28676, "r_x1": 545.11499, "r_y1": 677.28676, "r_x2": 545.11499, "r_y2": 668.38019, "r_x3": 308.862, "r_y3": 668.38019, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24176, "r_x1": 545.11505, "r_y1": 689.24176, "r_x2": 545.11505, "r_y2": 680.33519, "r_x3": 308.862, "r_y3": 680.33519, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196762, "r_x1": 545.11505, "r_y1": 701.196762, "r_x2": 545.11505, "r_y2": 692.290192, "r_x3": 308.862, "r_y3": 692.290192, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151764, "r_x1": 545.11511, "r_y1": 713.151764, "r_x2": 545.11511, "r_y2": 704.245193, "r_x3": 308.862, "r_y3": 704.245193, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133198, "r": 300.10229, "b": 743.039761, "coord_origin": "TOPLEFT" }, "confidence": 0.8715606927871704, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039761, "r_x1": 300.10229, "r_y1": 743.039761, "r_x2": 300.10229, "r_y2": 734.133198, "r_x3": 295.121, "r_y3": 734.133198, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 10, "page_no": 2, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 250.15102, "b": 84.11492999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.8767216801643372, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 250.15102, "r_y1": 84.11492999999996, "r_x2": 250.15102, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tag-decoder which is constrained to the table-tags." }, { "label": "text", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.112, "t": 87.21935999999994, "r": 286.36514, "b": 275.45410000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9822593927383423, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.12591999999995, "r_x1": 70.365845, "r_y1": 96.12591999999995, "r_x2": 70.365845, "r_y2": 87.21935999999994, "r_x3": 62.067001, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.931198, "r_y0": 96.12591999999995, "r_x1": 110.95348000000001, "r_y1": 96.12591999999995, "r_x2": 110.95348000000001, "r_y2": 87.21935999999994, "r_x3": 76.931198, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54498, "r_y0": 96.12591999999995, "r_x1": 136.25848, "r_y1": 96.12591999999995, "r_x2": 136.25848, "r_y2": 87.21935999999994, "r_x3": 118.54498, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82384, "r_y0": 96.12591999999995, "r_x1": 175.37166, "r_y1": 96.12591999999995, "r_x2": 175.37166, "r_y2": 87.21935999999994, "r_x3": 142.82384, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.94698, "r_y0": 96.12591999999995, "r_x1": 232.83594000000002, "r_y1": 96.12591999999995, "r_x2": 232.83594000000002, "r_y2": 87.21935999999994, "r_x3": 181.94698, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41125, "r_y0": 96.12591999999995, "r_x1": 265.41364, "r_y1": 96.12591999999995, "r_x2": 265.41364, "r_y2": 87.21935999999994, "r_x3": 239.41125, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.979, "r_y0": 96.12591999999995, "r_x1": 286.36499, "r_y1": 96.12591999999995, "r_x2": 286.36499, "r_y2": 87.21935999999994, "r_x3": 271.979, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.08092999999997, "r_x1": 286.36505, "r_y1": 108.08092999999997, "r_x2": 286.36505, "r_y2": 99.17437999999993, "r_x3": 50.112, "r_y3": 99.17437999999993, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.03692999999998, "r_x1": 286.36511, "r_y1": 120.03692999999998, "r_x2": 286.36511, "r_y2": 111.13036999999997, "r_x3": 50.112, "r_y3": 111.13036999999997, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.99194, "r_x1": 286.36505, "r_y1": 131.99194, "r_x2": 286.36505, "r_y2": 123.08538999999996, "r_x3": 50.112, "r_y3": 123.08538999999996, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.94696, "r_x1": 286.36514, "r_y1": 143.94696, "r_x2": 286.36514, "r_y2": 135.04040999999995, "r_x3": 50.112, "r_y3": 135.04040999999995, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.90197999999998, "r_x1": 286.36511, "r_y1": 155.90197999999998, "r_x2": 286.36511, "r_y2": 146.99541999999997, "r_x3": 50.112, "r_y3": 146.99541999999997, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 167.85699, "r_x1": 286.36505, "r_y1": 167.85699, "r_x2": 286.36505, "r_y2": 158.95043999999996, "r_x3": 50.112, "r_y3": 158.95043999999996, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 179.81201, "r_x1": 286.36508, "r_y1": 179.81201, "r_x2": 286.36508, "r_y2": 170.90545999999995, "r_x3": 50.112, "r_y3": 170.90545999999995, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 191.76801, "r_x1": 286.36508, "r_y1": 191.76801, "r_x2": 286.36508, "r_y2": 182.86145, "r_x3": 50.112, "r_y3": 182.86145, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 203.72302000000002, "r_x1": 286.36511, "r_y1": 203.72302000000002, "r_x2": 286.36511, "r_y2": 194.81646999999998, "r_x3": 50.112, "r_y3": 194.81646999999998, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 215.67804, "r_x1": 286.36511, "r_y1": 215.67804, "r_x2": 286.36511, "r_y2": 206.77148, "r_x3": 50.112, "r_y3": 206.77148, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 227.63306, "r_x1": 286.36505, "r_y1": 227.63306, "r_x2": 286.36505, "r_y2": 218.7265, "r_x3": 50.112, "r_y3": 218.7265, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 239.58807000000002, "r_x1": 286.36505, "r_y1": 239.58807000000002, "r_x2": 286.36505, "r_y2": 230.68151999999998, "r_x3": 50.112, "r_y3": 230.68151999999998, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 251.54309, "r_x1": 286.36511, "r_y1": 251.54309, "r_x2": 286.36511, "r_y2": 242.63653999999997, "r_x3": 50.112, "r_y3": 242.63653999999997, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 263.49908000000005, "r_x1": 286.36508, "r_y1": 263.49908000000005, "r_x2": 286.36508, "r_y2": 254.59253, "r_x3": 50.112, "r_y3": 254.59253, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 275.45410000000004, "r_x1": 64.776947, "r_y1": 275.45410000000004, "r_x2": 64.776947, "r_y2": 266.54755, "r_x3": 50.112, "r_y3": 266.54755, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.111992, "t": 278.43895999999995, "r": 286.36511, "b": 490.70288, "coord_origin": "TOPLEFT" }, "confidence": 0.9878450036048889, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 287.39536, "r_x1": 171.56593, "r_y1": 287.39536, "r_x2": 171.56593, "r_y2": 278.43895999999995, "r_x3": 62.067001, "r_y3": 278.43895999999995, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.56799, "r_y0": 287.46509, "r_x1": 174.3376, "r_y1": 287.46509, "r_x2": 174.3376, "r_y2": 278.55853, "r_x3": 171.56799, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.18687, "r_y0": 287.46509, "r_x1": 286.35709, "r_y1": 287.46509, "r_x2": 286.35709, "r_y2": 278.55853, "r_x3": 185.18687, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 299.42108, "r_x1": 286.36511, "r_y1": 299.42108, "r_x2": 286.36511, "r_y2": 290.51453000000004, "r_x3": 50.111992, "r_y3": 290.51453000000004, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 311.37607, "r_x1": 131.16771, "r_y1": 311.37607, "r_x2": 131.16771, "r_y2": 302.46950999999996, "r_x3": 50.111992, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.84888, "r_y0": 311.37607, "r_x1": 286.36508, "r_y1": 311.37607, "r_x2": 286.36508, "r_y2": 302.46950999999996, "r_x3": 138.84888, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 323.33105, "r_x1": 286.36505, "r_y1": 323.33105, "r_x2": 286.36505, "r_y2": 314.4245, "r_x3": 50.111992, "r_y3": 314.4245, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 335.28604, "r_x1": 286.36508, "r_y1": 335.28604, "r_x2": 286.36508, "r_y2": 326.37949000000003, "r_x3": 50.111992, "r_y3": 326.37949000000003, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 347.2410300000001, "r_x1": 286.36505, "r_y1": 347.2410300000001, "r_x2": 286.36505, "r_y2": 338.33447, "r_x3": 50.111992, "r_y3": 338.33447, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 359.19601, "r_x1": 286.36505, "r_y1": 359.19601, "r_x2": 286.36505, "r_y2": 350.28946, "r_x3": 50.111992, "r_y3": 350.28946, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 371.15201, "r_x1": 286.36508, "r_y1": 371.15201, "r_x2": 286.36508, "r_y2": 362.24545000000006, "r_x3": 50.111992, "r_y3": 362.24545000000006, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 383.10699, "r_x1": 286.36508, "r_y1": 383.10699, "r_x2": 286.36508, "r_y2": 374.20044, "r_x3": 50.111992, "r_y3": 374.20044, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 395.06198, "r_x1": 286.36508, "r_y1": 395.06198, "r_x2": 286.36508, "r_y2": 386.15542999999997, "r_x3": 50.111992, "r_y3": 386.15542999999997, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 407.01697, "r_x1": 286.36508, "r_y1": 407.01697, "r_x2": 286.36508, "r_y2": 398.11041000000006, "r_x3": 50.111992, "r_y3": 398.11041000000006, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 418.97195, "r_x1": 286.36508, "r_y1": 418.97195, "r_x2": 286.36508, "r_y2": 410.0654, "r_x3": 50.111992, "r_y3": 410.0654, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 430.92694, "r_x1": 286.36505, "r_y1": 430.92694, "r_x2": 286.36505, "r_y2": 422.02038999999996, "r_x3": 50.111992, "r_y3": 422.02038999999996, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 442.88293, "r_x1": 198.2359, "r_y1": 442.88293, "r_x2": 198.2359, "r_y2": 433.97638, "r_x3": 50.111992, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.92703, "r_y0": 442.88293, "r_x1": 286.36505, "r_y1": 442.88293, "r_x2": 286.36505, "r_y2": 433.97638, "r_x3": 205.92703, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 454.83792000000005, "r_x1": 286.36508, "r_y1": 454.83792000000005, "r_x2": 286.36508, "r_y2": 445.93137, "r_x3": 50.111992, "r_y3": 445.93137, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 466.79291, "r_x1": 286.36505, "r_y1": 466.79291, "r_x2": 286.36505, "r_y2": 457.88635, "r_x3": 50.111992, "r_y3": 457.88635, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 478.74789, "r_x1": 286.36505, "r_y1": 478.74789, "r_x2": 286.36505, "r_y2": 469.84134, "r_x3": 50.111992, "r_y3": 469.84134, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 490.70288, "r_x1": 186.49998, "r_y1": 490.70288, "r_x2": 186.49998, "r_y2": 481.79633, "r_x3": 50.111992, "r_y3": 481.79633, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.111984, "t": 493.68875, "r": 286.36627, "b": 622.26685, "coord_origin": "TOPLEFT" }, "confidence": 0.9875094294548035, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066994, "r_y0": 502.64514, "r_x1": 252.88068000000004, "r_y1": 502.64514, "r_x2": 252.88068000000004, "r_y2": 493.68875, "r_x3": 62.066994, "r_y3": 493.68875, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88199, "r_y0": 502.71487, "r_x1": 286.36627, "r_y1": 502.71487, "r_x2": 286.36627, "r_y2": 493.80832, "r_x3": 252.88199, "r_y3": 493.80832, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 514.66986, "r_x1": 286.36505, "r_y1": 514.66986, "r_x2": 286.36505, "r_y2": 505.76331, "r_x3": 50.111984, "r_y3": 505.76331, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 526.6248499999999, "r_x1": 286.36505, "r_y1": 526.6248499999999, "r_x2": 286.36505, "r_y2": 517.71829, "r_x3": 50.111984, "r_y3": 517.71829, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 538.57985, "r_x1": 286.36508, "r_y1": 538.57985, "r_x2": 286.36508, "r_y2": 529.67328, "r_x3": 50.111984, "r_y3": 529.67328, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 550.53584, "r_x1": 286.36508, "r_y1": 550.53584, "r_x2": 286.36508, "r_y2": 541.62929, "r_x3": 50.111984, "r_y3": 541.62929, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 562.4908399999999, "r_x1": 286.36511, "r_y1": 562.4908399999999, "r_x2": 286.36511, "r_y2": 553.58429, "r_x3": 50.111984, "r_y3": 553.58429, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 574.44585, "r_x1": 286.36511, "r_y1": 574.44585, "r_x2": 286.36511, "r_y2": 565.5392899999999, "r_x3": 50.111984, "r_y3": 565.5392899999999, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 586.40085, "r_x1": 286.36502, "r_y1": 586.40085, "r_x2": 286.36502, "r_y2": 577.49429, "r_x3": 50.111984, "r_y3": 577.49429, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 598.35585, "r_x1": 286.36505, "r_y1": 598.35585, "r_x2": 286.36505, "r_y2": 589.4493, "r_x3": 50.111984, "r_y3": 589.4493, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 610.31085, "r_x1": 286.36502, "r_y1": 610.31085, "r_x2": 286.36502, "r_y2": 601.4043, "r_x3": 50.111984, "r_y3": 601.4043, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 622.26685, "r_x1": 175.98943, "r_y1": 622.26685, "r_x2": 175.98943, "r_y2": 613.36029, "r_x3": 50.111984, "r_y3": 613.36029, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered." }, { "label": "section_header", "id": 8, "page_no": 2, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 50.111984, "t": 635.94484, "r": 105.22546, "b": 646.6925699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9423062205314636, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 646.6925699999999, "r_x1": 57.82375699999999, "r_y1": 646.6925699999999, "r_x2": 57.82375699999999, "r_y2": 635.94484, "r_x3": 50.111984, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.106125, "r_y0": 646.6925699999999, "r_x1": 105.22546, "r_y1": 646.6925699999999, "r_x2": 105.22546, "r_y2": 635.94484, "r_x3": 68.106125, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Datasets" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.111984, "t": 656.42529, "r": 286.36508, "b": 713.151863, "coord_origin": "TOPLEFT" }, "confidence": 0.9862047433853149, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 665.33186, "r_x1": 286.36493, "r_y1": 665.33186, "r_x2": 286.36493, "r_y2": 656.42529, "r_x3": 62.06698600000001, "r_y3": 656.42529, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 677.2868599999999, "r_x1": 286.36508, "r_y1": 677.2868599999999, "r_x2": 286.36508, "r_y2": 668.38029, "r_x3": 50.111984, "r_y3": 668.38029, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 689.24186, "r_x1": 286.36502, "r_y1": 689.24186, "r_x2": 286.36502, "r_y2": 680.3353, "r_x3": 50.111984, "r_y3": 680.3353, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 701.196861, "r_x1": 166.24602, "r_y1": 701.196861, "r_x2": 166.24602, "r_y2": 692.290298, "r_x3": 50.111984, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.68808, "r_y0": 701.196861, "r_x1": 286.36508, "r_y1": 701.196861, "r_x2": 286.36508, "r_y2": 692.290298, "r_x3": 173.68808, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 713.151863, "r_x1": 286.36505, "r_y1": 713.151863, "r_x2": 286.36505, "r_y2": 704.2453, "r_x3": 50.111984, "r_y3": 704.2453, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-" }, { "label": "picture", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT" }, "confidence": 0.9746918082237244, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.79849, "r_y0": 88.55975000000001, "r_x1": 486.84909, "r_y1": 88.55975000000001, "r_x2": 486.84909, "r_y2": 79.81176999999991, "r_x3": 380.79849, "r_y3": 79.81176999999991, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.76776, "r_y0": 250.77495999999996, "r_x1": 469.78748, "r_y1": 250.77495999999996, "r_x2": 469.78748, "r_y2": 242.02697999999998, "r_x3": 396.76776, "r_y3": 242.02697999999998, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.97653, "r_y0": 239.255, "r_x1": 324.79254, "r_y1": 239.255, "r_x2": 324.79254, "r_y2": 233.42296999999996, "r_x3": 320.97653, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.483, "r_y0": 239.255, "r_x1": 418.11319, "r_y1": 239.255, "r_x2": 418.11319, "r_y2": 233.42296999999996, "r_x3": 410.483, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.84949, "r_y0": 239.255, "r_x1": 508.47968000000003, "r_y1": 239.255, "r_x2": 508.47968000000003, "r_y2": 233.42296999999996, "r_x3": 500.84949, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.29999, "r_y0": 239.255, "r_x1": 372.93018, "r_y1": 239.255, "r_x2": 372.93018, "r_y2": 233.42296999999996, "r_x3": 365.29999, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.66626, "r_y0": 239.255, "r_x1": 463.29645, "r_y1": 239.255, "r_x2": 463.29645, "r_y2": 233.42296999999996, "r_x3": 455.66626, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.03528, "r_y0": 239.255, "r_x1": 549.66547, "r_y1": 239.255, "r_x2": 549.66547, "r_y2": 233.42296999999996, "r_x3": 542.03528, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04474, "r_y0": 236.27819999999997, "r_x1": 319.86075, "r_y1": 236.27819999999997, "r_x2": 319.86075, "r_y2": 230.44617000000005, "r_x3": 316.04474, "r_y3": 230.44617000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.62521, "r_y0": 204.52277000000004, "r_x1": 316.44122, "r_y1": 204.52277000000004, "r_x2": 316.44122, "r_y2": 198.69073000000003, "r_x3": 312.62521, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.43942, "r_y0": 204.52277000000004, "r_x1": 320.2554, "r_y1": 204.52277000000004, "r_x2": 320.2554, "r_y2": 198.69073000000003, "r_x3": 316.43942, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.14951, "r_y0": 173.92998999999998, "r_x1": 316.96552, "r_y1": 173.92998999999998, "r_x2": 316.96552, "r_y2": 168.09795999999994, "r_x3": 313.14951, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96371, "r_y0": 173.92998999999998, "r_x1": 320.77969, "r_y1": 173.92998999999998, "r_x2": 320.77969, "r_y2": 168.09795999999994, "r_x3": 316.96371, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.92972, "r_y0": 142.41974000000005, "r_x1": 316.74573, "r_y1": 142.41974000000005, "r_x2": 316.74573, "r_y2": 136.58771000000002, "r_x3": 312.92972, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74393, "r_y0": 142.41974000000005, "r_x1": 320.55991, "r_y1": 142.41974000000005, "r_x2": 320.55991, "r_y2": 136.58771000000002, "r_x3": 316.74393, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 111.43377999999996, "r_x1": 316.29828, "r_y1": 111.43377999999996, "r_x2": 316.29828, "r_y2": 105.60175000000004, "r_x3": 312.48227, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 111.43377999999996, "r_x1": 320.11246, "r_y1": 111.43377999999996, "r_x2": 320.11246, "r_y2": 105.60175000000004, "r_x3": 316.29648, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 218.09124999999995, "r_x1": 316.29828, "r_y1": 218.09124999999995, "r_x2": 316.29828, "r_y2": 212.25922000000003, "r_x3": 312.48227, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 218.09124999999995, "r_x1": 320.11246, "r_y1": 218.09124999999995, "r_x2": 320.11246, "r_y2": 212.25922000000003, "r_x3": 316.29648, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.07639, "r_y0": 189.55402000000004, "r_x1": 316.8924, "r_y1": 189.55402000000004, "r_x2": 316.8924, "r_y2": 183.72198000000003, "r_x3": 313.07639, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89059, "r_y0": 189.55402000000004, "r_x1": 320.70657, "r_y1": 189.55402000000004, "r_x2": 320.70657, "r_y2": 183.72198000000003, "r_x3": 316.89059, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76321, "r_y0": 158.30602999999996, "r_x1": 316.57922, "r_y1": 158.30602999999996, "r_x2": 316.57922, "r_y2": 152.47400000000005, "r_x3": 312.76321, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.57742, "r_y0": 158.30602999999996, "r_x1": 320.3934, "r_y1": 158.30602999999996, "r_x2": 320.3934, "r_y2": 152.47400000000005, "r_x3": 316.57742, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.19775, "r_y0": 126.40252999999996, "r_x1": 316.01376, "r_y1": 126.40252999999996, "r_x2": 316.01376, "r_y2": 120.57050000000004, "r_x3": 312.19775, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01196, "r_y0": 126.40252999999996, "r_x1": 319.82794, "r_y1": 126.40252999999996, "r_x2": 319.82794, "r_y2": 120.57050000000004, "r_x3": 316.01196, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8165, "r_y0": 95.94073000000003, "r_x1": 316.63251, "r_y1": 95.94073000000003, "r_x2": 316.63251, "r_y2": 90.1087, "r_x3": 312.8165, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63071, "r_y0": 95.94073000000003, "r_x1": 320.44669, "r_y1": 95.94073000000003, "r_x2": 320.44669, "r_y2": 90.1087, "r_x3": 316.63071, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17426, "r_y0": 230.01727000000005, "r_x1": 536.94427, "r_y1": 230.01727000000005, "r_x2": 536.94427, "r_y2": 222.72729000000004, "r_x3": 532.17426, "r_y3": 222.72729000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.87952, "r_y0": 115.55700999999999, "r_x1": 547.61249, "r_y1": 115.55700999999999, "r_x2": 547.61249, "r_y2": 108.26702999999986, "r_x3": 532.87952, "r_y3": 108.26702999999986, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.7735, "r_y0": 138.07097999999996, "r_x1": 542.73877, "r_y1": 138.07097999999996, "r_x2": 542.73877, "r_y2": 130.78101000000004, "r_x3": 532.7735, "r_y3": 130.78101000000004, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.79901, "r_y0": 161.21349999999995, "r_x1": 542.76428, "r_y1": 161.21349999999995, "r_x2": 542.76428, "r_y2": 153.92352000000005, "r_x3": 532.79901, "r_y3": 153.92352000000005, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.5705, "r_y0": 184.04796999999996, "r_x1": 542.53577, "r_y1": 184.04796999999996, "r_x2": 542.53577, "r_y2": 176.75800000000004, "r_x3": 532.5705, "r_y3": 176.75800000000004, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.14551, "r_y0": 206.93628, "r_x1": 542.11078, "r_y1": 206.93628, "r_x2": 542.11078, "r_y2": 199.6463, "r_x3": 532.14551, "r_y3": 199.6463, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 12, "label": "section_header", "bbox": { "l": 380.79849, "t": 79.81176999999991, "r": 486.84909, "b": 88.55975000000001, "coord_origin": "TOPLEFT" }, "confidence": 0.5687217116355896, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.79849, "r_y0": 88.55975000000001, "r_x1": 486.84909, "r_y1": 88.55975000000001, "r_x2": 486.84909, "r_y2": 79.81176999999991, "r_x3": 380.79849, "r_y3": 79.81176999999991, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 396.76776, "t": 242.02697999999998, "r": 469.78748, "b": 250.77495999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.76776, "r_y0": 250.77495999999996, "r_x1": 469.78748, "r_y1": 250.77495999999996, "r_x2": 469.78748, "r_y2": 242.02697999999998, "r_x3": 396.76776, "r_y3": 242.02697999999998, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 320.97653, "t": 233.42296999999996, "r": 324.79254, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.97653, "r_y0": 239.255, "r_x1": 324.79254, "r_y1": 239.255, "r_x2": 324.79254, "r_y2": 233.42296999999996, "r_x3": 320.97653, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 410.483, "t": 233.42296999999996, "r": 418.11319, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.483, "r_y0": 239.255, "r_x1": 418.11319, "r_y1": 239.255, "r_x2": 418.11319, "r_y2": 233.42296999999996, "r_x3": 410.483, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 500.84949, "t": 233.42296999999996, "r": 508.47968000000003, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.84949, "r_y0": 239.255, "r_x1": 508.47968000000003, "r_y1": 239.255, "r_x2": 508.47968000000003, "r_y2": 233.42296999999996, "r_x3": 500.84949, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 365.29999, "t": 233.42296999999996, "r": 372.93018, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.29999, "r_y0": 239.255, "r_x1": 372.93018, "r_y1": 239.255, "r_x2": 372.93018, "r_y2": 233.42296999999996, "r_x3": 365.29999, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 455.66626, "t": 233.42296999999996, "r": 463.29645, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.66626, "r_y0": 239.255, "r_x1": 463.29645, "r_y1": 239.255, "r_x2": 463.29645, "r_y2": 233.42296999999996, "r_x3": 455.66626, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 542.03528, "t": 233.42296999999996, "r": 549.66547, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.03528, "r_y0": 239.255, "r_x1": 549.66547, "r_y1": 239.255, "r_x2": 549.66547, "r_y2": 233.42296999999996, "r_x3": 542.03528, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 316.04474, "t": 230.44617000000005, "r": 319.86075, "b": 236.27819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04474, "r_y0": 236.27819999999997, "r_x1": 319.86075, "r_y1": 236.27819999999997, "r_x2": 319.86075, "r_y2": 230.44617000000005, "r_x3": 316.04474, "r_y3": 230.44617000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 312.62521, "t": 198.69073000000003, "r": 316.44122, "b": 204.52277000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.62521, "r_y0": 204.52277000000004, "r_x1": 316.44122, "r_y1": 204.52277000000004, "r_x2": 316.44122, "r_y2": 198.69073000000003, "r_x3": 312.62521, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 316.43942, "t": 198.69073000000003, "r": 320.2554, "b": 204.52277000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.43942, "r_y0": 204.52277000000004, "r_x1": 320.2554, "r_y1": 204.52277000000004, "r_x2": 320.2554, "r_y2": 198.69073000000003, "r_x3": 316.43942, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 313.14951, "t": 168.09795999999994, "r": 316.96552, "b": 173.92998999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.14951, "r_y0": 173.92998999999998, "r_x1": 316.96552, "r_y1": 173.92998999999998, "r_x2": 316.96552, "r_y2": 168.09795999999994, "r_x3": 313.14951, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 316.96371, "t": 168.09795999999994, "r": 320.77969, "b": 173.92998999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96371, "r_y0": 173.92998999999998, "r_x1": 320.77969, "r_y1": 173.92998999999998, "r_x2": 320.77969, "r_y2": 168.09795999999994, "r_x3": 316.96371, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 312.92972, "t": 136.58771000000002, "r": 316.74573, "b": 142.41974000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.92972, "r_y0": 142.41974000000005, "r_x1": 316.74573, "r_y1": 142.41974000000005, "r_x2": 316.74573, "r_y2": 136.58771000000002, "r_x3": 312.92972, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 316.74393, "t": 136.58771000000002, "r": 320.55991, "b": 142.41974000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74393, "r_y0": 142.41974000000005, "r_x1": 320.55991, "r_y1": 142.41974000000005, "r_x2": 320.55991, "r_y2": 136.58771000000002, "r_x3": 316.74393, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 312.48227, "t": 105.60175000000004, "r": 316.29828, "b": 111.43377999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 111.43377999999996, "r_x1": 316.29828, "r_y1": 111.43377999999996, "r_x2": 316.29828, "r_y2": 105.60175000000004, "r_x3": 312.48227, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 316.29648, "t": 105.60175000000004, "r": 320.11246, "b": 111.43377999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 111.43377999999996, "r_x1": 320.11246, "r_y1": 111.43377999999996, "r_x2": 320.11246, "r_y2": 105.60175000000004, "r_x3": 316.29648, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 312.48227, "t": 212.25922000000003, "r": 316.29828, "b": 218.09124999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 218.09124999999995, "r_x1": 316.29828, "r_y1": 218.09124999999995, "r_x2": 316.29828, "r_y2": 212.25922000000003, "r_x3": 312.48227, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 316.29648, "t": 212.25922000000003, "r": 320.11246, "b": 218.09124999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 218.09124999999995, "r_x1": 320.11246, "r_y1": 218.09124999999995, "r_x2": 320.11246, "r_y2": 212.25922000000003, "r_x3": 316.29648, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 313.07639, "t": 183.72198000000003, "r": 316.8924, "b": 189.55402000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.07639, "r_y0": 189.55402000000004, "r_x1": 316.8924, "r_y1": 189.55402000000004, "r_x2": 316.8924, "r_y2": 183.72198000000003, "r_x3": 313.07639, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 316.89059, "t": 183.72198000000003, "r": 320.70657, "b": 189.55402000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89059, "r_y0": 189.55402000000004, "r_x1": 320.70657, "r_y1": 189.55402000000004, "r_x2": 320.70657, "r_y2": 183.72198000000003, "r_x3": 316.89059, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 312.76321, "t": 152.47400000000005, "r": 316.57922, "b": 158.30602999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76321, "r_y0": 158.30602999999996, "r_x1": 316.57922, "r_y1": 158.30602999999996, "r_x2": 316.57922, "r_y2": 152.47400000000005, "r_x3": 312.76321, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 316.57742, "t": 152.47400000000005, "r": 320.3934, "b": 158.30602999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.57742, "r_y0": 158.30602999999996, "r_x1": 320.3934, "r_y1": 158.30602999999996, "r_x2": 320.3934, "r_y2": 152.47400000000005, "r_x3": 316.57742, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 312.19775, "t": 120.57050000000004, "r": 316.01376, "b": 126.40252999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.19775, "r_y0": 126.40252999999996, "r_x1": 316.01376, "r_y1": 126.40252999999996, "r_x2": 316.01376, "r_y2": 120.57050000000004, "r_x3": 312.19775, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 316.01196, "t": 120.57050000000004, "r": 319.82794, "b": 126.40252999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01196, "r_y0": 126.40252999999996, "r_x1": 319.82794, "r_y1": 126.40252999999996, "r_x2": 319.82794, "r_y2": 120.57050000000004, "r_x3": 316.01196, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 312.8165, "t": 90.1087, "r": 316.63251, "b": 95.94073000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8165, "r_y0": 95.94073000000003, "r_x1": 316.63251, "r_y1": 95.94073000000003, "r_x2": 316.63251, "r_y2": 90.1087, "r_x3": 312.8165, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 316.63071, "t": 90.1087, "r": 320.44669, "b": 95.94073000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63071, "r_y0": 95.94073000000003, "r_x1": 320.44669, "r_y1": 95.94073000000003, "r_x2": 320.44669, "r_y2": 90.1087, "r_x3": 316.63071, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 532.17426, "t": 222.72729000000004, "r": 536.94427, "b": 230.01727000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17426, "r_y0": 230.01727000000005, "r_x1": 536.94427, "r_y1": 230.01727000000005, "r_x2": 536.94427, "r_y2": 222.72729000000004, "r_x3": 532.17426, "r_y3": 222.72729000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 532.87952, "t": 108.26702999999986, "r": 547.61249, "b": 115.55700999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.87952, "r_y0": 115.55700999999999, "r_x1": 547.61249, "r_y1": 115.55700999999999, "r_x2": 547.61249, "r_y2": 108.26702999999986, "r_x3": 532.87952, "r_y3": 108.26702999999986, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 532.7735, "t": 130.78101000000004, "r": 542.73877, "b": 138.07097999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.7735, "r_y0": 138.07097999999996, "r_x1": 542.73877, "r_y1": 138.07097999999996, "r_x2": 542.73877, "r_y2": 130.78101000000004, "r_x3": 532.7735, "r_y3": 130.78101000000004, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 532.79901, "t": 153.92352000000005, "r": 542.76428, "b": 161.21349999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.79901, "r_y0": 161.21349999999995, "r_x1": 542.76428, "r_y1": 161.21349999999995, "r_x2": 542.76428, "r_y2": 153.92352000000005, "r_x3": 532.79901, "r_y3": 153.92352000000005, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 532.5705, "t": 176.75800000000004, "r": 542.53577, "b": 184.04796999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.5705, "r_y0": 184.04796999999996, "r_x1": 542.53577, "r_y1": 184.04796999999996, "r_x2": 542.53577, "r_y2": 176.75800000000004, "r_x3": 532.5705, "r_y3": 176.75800000000004, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 532.14551, "t": 199.6463, "r": 542.11078, "b": 206.93628, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.14551, "r_y0": 206.93628, "r_x1": 542.11078, "r_y1": 206.93628, "r_x2": 542.11078, "r_y2": 199.6463, "r_x3": 532.14551, "r_y3": 199.6463, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 7, "page_no": 2, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 308.862, "t": 267.83636, "r": 545.11511, "b": 288.6979099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9667505025863647, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 276.74292, "r_x1": 346.06238, "r_y1": 276.74292, "r_x2": 346.06238, "r_y2": 267.83636, "r_x3": 308.862, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49072, "r_y0": 276.74292, "r_x1": 545.11511, "r_y1": 276.74292, "r_x2": 545.11511, "r_y2": 267.83636, "r_x3": 354.49072, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 288.6979099999999, "r_x1": 498.56989, "r_y1": 288.6979099999999, "r_x2": 498.56989, "r_y2": 279.79132000000004, "r_x3": 308.862, "r_y3": 279.79132000000004, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets" }, { "label": "text", "id": 9, "page_no": 2, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.862, "t": 317.47336, "r": 437.27002, "b": 326.37991, "coord_origin": "TOPLEFT" }, "confidence": 0.8879811763763428, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 326.37991, "r_x1": 437.27002, "r_y1": 326.37991, "r_x2": 437.27002, "r_y2": 317.47336, "r_x3": 308.862, "r_y3": 317.47336, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "balance in the previous datasets." }, { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.862, "t": 331.53137, "r": 545.11517, "b": 627.36174, "coord_origin": "TOPLEFT" }, "confidence": 0.9870319366455078, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 340.43793, "r_x1": 545.11505, "r_y1": 340.43793, "r_x2": 545.11505, "r_y2": 331.53137, "r_x3": 320.81699, "r_y3": 331.53137, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 352.39291, "r_x1": 545.11517, "r_y1": 352.39291, "r_x2": 545.11517, "r_y2": 343.48635999999993, "r_x3": 308.862, "r_y3": 343.48635999999993, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 364.34890999999993, "r_x1": 545.11505, "r_y1": 364.34890999999993, "r_x2": 545.11505, "r_y2": 355.44235, "r_x3": 308.862, "r_y3": 355.44235, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 376.30389, "r_x1": 545.11505, "r_y1": 376.30389, "r_x2": 545.11505, "r_y2": 367.39734, "r_x3": 308.862, "r_y3": 367.39734, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 388.25888, "r_x1": 545.11511, "r_y1": 388.25888, "r_x2": 545.11511, "r_y2": 379.35233, "r_x3": 308.862, "r_y3": 379.35233, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.21386999999993, "r_x1": 545.11511, "r_y1": 400.21386999999993, "r_x2": 545.11511, "r_y2": 391.30731, "r_x3": 308.862, "r_y3": 391.30731, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.16885, "r_x1": 545.11505, "r_y1": 412.16885, "r_x2": 545.11505, "r_y2": 403.26230000000004, "r_x3": 308.862, "r_y3": 403.26230000000004, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.12384, "r_x1": 545.11511, "r_y1": 424.12384, "r_x2": 545.11511, "r_y2": 415.21729, "r_x3": 308.862, "r_y3": 415.21729, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.0798300000001, "r_x1": 545.11517, "r_y1": 436.0798300000001, "r_x2": 545.11517, "r_y2": 427.17328, "r_x3": 308.862, "r_y3": 427.17328, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.03482, "r_x1": 545.11517, "r_y1": 448.03482, "r_x2": 545.11517, "r_y2": 439.12827, "r_x3": 308.862, "r_y3": 439.12827, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 459.98981000000003, "r_x1": 545.11511, "r_y1": 459.98981000000003, "r_x2": 545.11511, "r_y2": 451.08325, "r_x3": 308.862, "r_y3": 451.08325, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 471.94479, "r_x1": 545.11505, "r_y1": 471.94479, "r_x2": 545.11505, "r_y2": 463.03824, "r_x3": 308.862, "r_y3": 463.03824, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 483.89978, "r_x1": 545.11511, "r_y1": 483.89978, "r_x2": 545.11511, "r_y2": 474.99323, "r_x3": 308.862, "r_y3": 474.99323, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 495.85577, "r_x1": 545.11511, "r_y1": 495.85577, "r_x2": 545.11511, "r_y2": 486.94922, "r_x3": 308.862, "r_y3": 486.94922, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 507.81076, "r_x1": 545.11511, "r_y1": 507.81076, "r_x2": 545.11511, "r_y2": 498.90421, "r_x3": 308.862, "r_y3": 498.90421, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 519.76575, "r_x1": 545.11517, "r_y1": 519.76575, "r_x2": 545.11517, "r_y2": 510.85919, "r_x3": 308.862, "r_y3": 510.85919, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 531.72073, "r_x1": 545.11517, "r_y1": 531.72073, "r_x2": 545.11517, "r_y2": 522.8141800000001, "r_x3": 308.862, "r_y3": 522.8141800000001, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 543.67574, "r_x1": 545.11505, "r_y1": 543.67574, "r_x2": 545.11505, "r_y2": 534.76917, "r_x3": 308.862, "r_y3": 534.76917, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 555.6307400000001, "r_x1": 545.11511, "r_y1": 555.6307400000001, "r_x2": 545.11511, "r_y2": 546.72418, "r_x3": 308.862, "r_y3": 546.72418, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 567.58673, "r_x1": 545.11511, "r_y1": 567.58673, "r_x2": 545.11511, "r_y2": 558.6801800000001, "r_x3": 308.862, "r_y3": 558.6801800000001, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 579.54173, "r_x1": 545.11505, "r_y1": 579.54173, "r_x2": 545.11505, "r_y2": 570.63518, "r_x3": 308.862, "r_y3": 570.63518, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 591.49673, "r_x1": 545.11499, "r_y1": 591.49673, "r_x2": 545.11499, "r_y2": 582.59018, "r_x3": 308.862, "r_y3": 582.59018, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 603.45174, "r_x1": 545.11517, "r_y1": 603.45174, "r_x2": 545.11517, "r_y2": 594.54518, "r_x3": 308.862, "r_y3": 594.54518, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 615.40674, "r_x1": 545.11511, "r_y1": 615.40674, "r_x2": 545.11511, "r_y2": 606.50018, "r_x3": 308.862, "r_y3": 606.50018, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 627.36174, "r_x1": 348.16446, "r_y1": 627.36174, "r_x2": 348.16446, "r_y2": 618.45518, "r_x3": 308.862, "r_y3": 618.45518, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits." }, { "label": "text", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.862, "t": 632.51419, "r": 545.11511, "b": 713.151764, "coord_origin": "TOPLEFT" }, "confidence": 0.9840091466903687, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 641.42075, "r_x1": 545.11487, "r_y1": 641.42075, "r_x2": 545.11487, "r_y2": 632.51419, "r_x3": 320.81699, "r_y3": 632.51419, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.37575, "r_x1": 545.11511, "r_y1": 653.37575, "r_x2": 545.11511, "r_y2": 644.46919, "r_x3": 308.862, "r_y3": 644.46919, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.33076, "r_x1": 545.11511, "r_y1": 665.33076, "r_x2": 545.11511, "r_y2": 656.42419, "r_x3": 308.862, "r_y3": 656.42419, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28676, "r_x1": 545.11499, "r_y1": 677.28676, "r_x2": 545.11499, "r_y2": 668.38019, "r_x3": 308.862, "r_y3": 668.38019, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24176, "r_x1": 545.11505, "r_y1": 689.24176, "r_x2": 545.11505, "r_y2": 680.33519, "r_x3": 308.862, "r_y3": 680.33519, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196762, "r_x1": 545.11505, "r_y1": 701.196762, "r_x2": 545.11505, "r_y2": 692.290192, "r_x3": 308.862, "r_y3": 692.290192, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151764, "r_x1": 545.11511, "r_y1": 713.151764, "r_x2": 545.11511, "r_y2": 704.245193, "r_x3": 308.862, "r_y3": 704.245193, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small" }, { "label": "page_footer", "id": 11, "page_no": 2, "cluster": { "id": 11, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133198, "r": 300.10229, "b": 743.039761, "coord_origin": "TOPLEFT" }, "confidence": 0.8715606927871704, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039761, "r_x1": 300.10229, "r_y1": 743.039761, "r_x2": 300.10229, "r_y2": 734.133198, "r_x3": 295.121, "r_y3": 734.133198, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" } ], "body": [ { "label": "text", "id": 10, "page_no": 2, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 250.15102, "b": 84.11492999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.8767216801643372, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 250.15102, "r_y1": 84.11492999999996, "r_x2": 250.15102, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tag-decoder which is constrained to the table-tags." }, { "label": "text", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.112, "t": 87.21935999999994, "r": 286.36514, "b": 275.45410000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9822593927383423, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.12591999999995, "r_x1": 70.365845, "r_y1": 96.12591999999995, "r_x2": 70.365845, "r_y2": 87.21935999999994, "r_x3": 62.067001, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.931198, "r_y0": 96.12591999999995, "r_x1": 110.95348000000001, "r_y1": 96.12591999999995, "r_x2": 110.95348000000001, "r_y2": 87.21935999999994, "r_x3": 76.931198, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54498, "r_y0": 96.12591999999995, "r_x1": 136.25848, "r_y1": 96.12591999999995, "r_x2": 136.25848, "r_y2": 87.21935999999994, "r_x3": 118.54498, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82384, "r_y0": 96.12591999999995, "r_x1": 175.37166, "r_y1": 96.12591999999995, "r_x2": 175.37166, "r_y2": 87.21935999999994, "r_x3": 142.82384, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.94698, "r_y0": 96.12591999999995, "r_x1": 232.83594000000002, "r_y1": 96.12591999999995, "r_x2": 232.83594000000002, "r_y2": 87.21935999999994, "r_x3": 181.94698, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41125, "r_y0": 96.12591999999995, "r_x1": 265.41364, "r_y1": 96.12591999999995, "r_x2": 265.41364, "r_y2": 87.21935999999994, "r_x3": 239.41125, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.979, "r_y0": 96.12591999999995, "r_x1": 286.36499, "r_y1": 96.12591999999995, "r_x2": 286.36499, "r_y2": 87.21935999999994, "r_x3": 271.979, "r_y3": 87.21935999999994, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.08092999999997, "r_x1": 286.36505, "r_y1": 108.08092999999997, "r_x2": 286.36505, "r_y2": 99.17437999999993, "r_x3": 50.112, "r_y3": 99.17437999999993, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 120.03692999999998, "r_x1": 286.36511, "r_y1": 120.03692999999998, "r_x2": 286.36511, "r_y2": 111.13036999999997, "r_x3": 50.112, "r_y3": 111.13036999999997, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.99194, "r_x1": 286.36505, "r_y1": 131.99194, "r_x2": 286.36505, "r_y2": 123.08538999999996, "r_x3": 50.112, "r_y3": 123.08538999999996, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.94696, "r_x1": 286.36514, "r_y1": 143.94696, "r_x2": 286.36514, "r_y2": 135.04040999999995, "r_x3": 50.112, "r_y3": 135.04040999999995, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.90197999999998, "r_x1": 286.36511, "r_y1": 155.90197999999998, "r_x2": 286.36511, "r_y2": 146.99541999999997, "r_x3": 50.112, "r_y3": 146.99541999999997, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 167.85699, "r_x1": 286.36505, "r_y1": 167.85699, "r_x2": 286.36505, "r_y2": 158.95043999999996, "r_x3": 50.112, "r_y3": 158.95043999999996, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 179.81201, "r_x1": 286.36508, "r_y1": 179.81201, "r_x2": 286.36508, "r_y2": 170.90545999999995, "r_x3": 50.112, "r_y3": 170.90545999999995, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 191.76801, "r_x1": 286.36508, "r_y1": 191.76801, "r_x2": 286.36508, "r_y2": 182.86145, "r_x3": 50.112, "r_y3": 182.86145, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 203.72302000000002, "r_x1": 286.36511, "r_y1": 203.72302000000002, "r_x2": 286.36511, "r_y2": 194.81646999999998, "r_x3": 50.112, "r_y3": 194.81646999999998, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 215.67804, "r_x1": 286.36511, "r_y1": 215.67804, "r_x2": 286.36511, "r_y2": 206.77148, "r_x3": 50.112, "r_y3": 206.77148, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 227.63306, "r_x1": 286.36505, "r_y1": 227.63306, "r_x2": 286.36505, "r_y2": 218.7265, "r_x3": 50.112, "r_y3": 218.7265, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 239.58807000000002, "r_x1": 286.36505, "r_y1": 239.58807000000002, "r_x2": 286.36505, "r_y2": 230.68151999999998, "r_x3": 50.112, "r_y3": 230.68151999999998, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 251.54309, "r_x1": 286.36511, "r_y1": 251.54309, "r_x2": 286.36511, "r_y2": 242.63653999999997, "r_x3": 50.112, "r_y3": 242.63653999999997, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 263.49908000000005, "r_x1": 286.36508, "r_y1": 263.49908000000005, "r_x2": 286.36508, "r_y2": 254.59253, "r_x3": 50.112, "r_y3": 254.59253, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 275.45410000000004, "r_x1": 64.776947, "r_y1": 275.45410000000004, "r_x2": 64.776947, "r_y2": 266.54755, "r_x3": 50.112, "r_y3": 266.54755, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.111992, "t": 278.43895999999995, "r": 286.36511, "b": 490.70288, "coord_origin": "TOPLEFT" }, "confidence": 0.9878450036048889, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 287.39536, "r_x1": 171.56593, "r_y1": 287.39536, "r_x2": 171.56593, "r_y2": 278.43895999999995, "r_x3": 62.067001, "r_y3": 278.43895999999995, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.56799, "r_y0": 287.46509, "r_x1": 174.3376, "r_y1": 287.46509, "r_x2": 174.3376, "r_y2": 278.55853, "r_x3": 171.56799, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.18687, "r_y0": 287.46509, "r_x1": 286.35709, "r_y1": 287.46509, "r_x2": 286.35709, "r_y2": 278.55853, "r_x3": 185.18687, "r_y3": 278.55853, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 299.42108, "r_x1": 286.36511, "r_y1": 299.42108, "r_x2": 286.36511, "r_y2": 290.51453000000004, "r_x3": 50.111992, "r_y3": 290.51453000000004, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 311.37607, "r_x1": 131.16771, "r_y1": 311.37607, "r_x2": 131.16771, "r_y2": 302.46950999999996, "r_x3": 50.111992, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.84888, "r_y0": 311.37607, "r_x1": 286.36508, "r_y1": 311.37607, "r_x2": 286.36508, "r_y2": 302.46950999999996, "r_x3": 138.84888, "r_y3": 302.46950999999996, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 323.33105, "r_x1": 286.36505, "r_y1": 323.33105, "r_x2": 286.36505, "r_y2": 314.4245, "r_x3": 50.111992, "r_y3": 314.4245, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 335.28604, "r_x1": 286.36508, "r_y1": 335.28604, "r_x2": 286.36508, "r_y2": 326.37949000000003, "r_x3": 50.111992, "r_y3": 326.37949000000003, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 347.2410300000001, "r_x1": 286.36505, "r_y1": 347.2410300000001, "r_x2": 286.36505, "r_y2": 338.33447, "r_x3": 50.111992, "r_y3": 338.33447, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 359.19601, "r_x1": 286.36505, "r_y1": 359.19601, "r_x2": 286.36505, "r_y2": 350.28946, "r_x3": 50.111992, "r_y3": 350.28946, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 371.15201, "r_x1": 286.36508, "r_y1": 371.15201, "r_x2": 286.36508, "r_y2": 362.24545000000006, "r_x3": 50.111992, "r_y3": 362.24545000000006, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 383.10699, "r_x1": 286.36508, "r_y1": 383.10699, "r_x2": 286.36508, "r_y2": 374.20044, "r_x3": 50.111992, "r_y3": 374.20044, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 395.06198, "r_x1": 286.36508, "r_y1": 395.06198, "r_x2": 286.36508, "r_y2": 386.15542999999997, "r_x3": 50.111992, "r_y3": 386.15542999999997, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 407.01697, "r_x1": 286.36508, "r_y1": 407.01697, "r_x2": 286.36508, "r_y2": 398.11041000000006, "r_x3": 50.111992, "r_y3": 398.11041000000006, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 418.97195, "r_x1": 286.36508, "r_y1": 418.97195, "r_x2": 286.36508, "r_y2": 410.0654, "r_x3": 50.111992, "r_y3": 410.0654, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 430.92694, "r_x1": 286.36505, "r_y1": 430.92694, "r_x2": 286.36505, "r_y2": 422.02038999999996, "r_x3": 50.111992, "r_y3": 422.02038999999996, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 442.88293, "r_x1": 198.2359, "r_y1": 442.88293, "r_x2": 198.2359, "r_y2": 433.97638, "r_x3": 50.111992, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.92703, "r_y0": 442.88293, "r_x1": 286.36505, "r_y1": 442.88293, "r_x2": 286.36505, "r_y2": 433.97638, "r_x3": 205.92703, "r_y3": 433.97638, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 454.83792000000005, "r_x1": 286.36508, "r_y1": 454.83792000000005, "r_x2": 286.36508, "r_y2": 445.93137, "r_x3": 50.111992, "r_y3": 445.93137, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 466.79291, "r_x1": 286.36505, "r_y1": 466.79291, "r_x2": 286.36505, "r_y2": 457.88635, "r_x3": 50.111992, "r_y3": 457.88635, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 478.74789, "r_x1": 286.36505, "r_y1": 478.74789, "r_x2": 286.36505, "r_y2": 469.84134, "r_x3": 50.111992, "r_y3": 469.84134, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 490.70288, "r_x1": 186.49998, "r_y1": 490.70288, "r_x2": 186.49998, "r_y2": 481.79633, "r_x3": 50.111992, "r_y3": 481.79633, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.111984, "t": 493.68875, "r": 286.36627, "b": 622.26685, "coord_origin": "TOPLEFT" }, "confidence": 0.9875094294548035, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.066994, "r_y0": 502.64514, "r_x1": 252.88068000000004, "r_y1": 502.64514, "r_x2": 252.88068000000004, "r_y2": 493.68875, "r_x3": 62.066994, "r_y3": 493.68875, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88199, "r_y0": 502.71487, "r_x1": 286.36627, "r_y1": 502.71487, "r_x2": 286.36627, "r_y2": 493.80832, "r_x3": 252.88199, "r_y3": 493.80832, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 514.66986, "r_x1": 286.36505, "r_y1": 514.66986, "r_x2": 286.36505, "r_y2": 505.76331, "r_x3": 50.111984, "r_y3": 505.76331, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 526.6248499999999, "r_x1": 286.36505, "r_y1": 526.6248499999999, "r_x2": 286.36505, "r_y2": 517.71829, "r_x3": 50.111984, "r_y3": 517.71829, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 538.57985, "r_x1": 286.36508, "r_y1": 538.57985, "r_x2": 286.36508, "r_y2": 529.67328, "r_x3": 50.111984, "r_y3": 529.67328, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 550.53584, "r_x1": 286.36508, "r_y1": 550.53584, "r_x2": 286.36508, "r_y2": 541.62929, "r_x3": 50.111984, "r_y3": 541.62929, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 562.4908399999999, "r_x1": 286.36511, "r_y1": 562.4908399999999, "r_x2": 286.36511, "r_y2": 553.58429, "r_x3": 50.111984, "r_y3": 553.58429, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 574.44585, "r_x1": 286.36511, "r_y1": 574.44585, "r_x2": 286.36511, "r_y2": 565.5392899999999, "r_x3": 50.111984, "r_y3": 565.5392899999999, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 586.40085, "r_x1": 286.36502, "r_y1": 586.40085, "r_x2": 286.36502, "r_y2": 577.49429, "r_x3": 50.111984, "r_y3": 577.49429, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 598.35585, "r_x1": 286.36505, "r_y1": 598.35585, "r_x2": 286.36505, "r_y2": 589.4493, "r_x3": 50.111984, "r_y3": 589.4493, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 610.31085, "r_x1": 286.36502, "r_y1": 610.31085, "r_x2": 286.36502, "r_y2": 601.4043, "r_x3": 50.111984, "r_y3": 601.4043, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 622.26685, "r_x1": 175.98943, "r_y1": 622.26685, "r_x2": 175.98943, "r_y2": 613.36029, "r_x3": 50.111984, "r_y3": 613.36029, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered." }, { "label": "section_header", "id": 8, "page_no": 2, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 50.111984, "t": 635.94484, "r": 105.22546, "b": 646.6925699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9423062205314636, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 646.6925699999999, "r_x1": 57.82375699999999, "r_y1": 646.6925699999999, "r_x2": 57.82375699999999, "r_y2": 635.94484, "r_x3": 50.111984, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.106125, "r_y0": 646.6925699999999, "r_x1": 105.22546, "r_y1": 646.6925699999999, "r_x2": 105.22546, "r_y2": 635.94484, "r_x3": 68.106125, "r_y3": 635.94484, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Datasets" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.111984, "t": 656.42529, "r": 286.36508, "b": 713.151863, "coord_origin": "TOPLEFT" }, "confidence": 0.9862047433853149, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 665.33186, "r_x1": 286.36493, "r_y1": 665.33186, "r_x2": 286.36493, "r_y2": 656.42529, "r_x3": 62.06698600000001, "r_y3": 656.42529, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 677.2868599999999, "r_x1": 286.36508, "r_y1": 677.2868599999999, "r_x2": 286.36508, "r_y2": 668.38029, "r_x3": 50.111984, "r_y3": 668.38029, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 689.24186, "r_x1": 286.36502, "r_y1": 689.24186, "r_x2": 286.36502, "r_y2": 680.3353, "r_x3": 50.111984, "r_y3": 680.3353, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 701.196861, "r_x1": 166.24602, "r_y1": 701.196861, "r_x2": 166.24602, "r_y2": 692.290298, "r_x3": 50.111984, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.68808, "r_y0": 701.196861, "r_x1": 286.36508, "r_y1": 701.196861, "r_x2": 286.36508, "r_y2": 692.290298, "r_x3": 173.68808, "r_y3": 692.290298, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 713.151863, "r_x1": 286.36505, "r_y1": 713.151863, "r_x2": 286.36505, "r_y2": 704.2453, "r_x3": 50.111984, "r_y3": 704.2453, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-" }, { "label": "picture", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT" }, "confidence": 0.9746918082237244, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.79849, "r_y0": 88.55975000000001, "r_x1": 486.84909, "r_y1": 88.55975000000001, "r_x2": 486.84909, "r_y2": 79.81176999999991, "r_x3": 380.79849, "r_y3": 79.81176999999991, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.76776, "r_y0": 250.77495999999996, "r_x1": 469.78748, "r_y1": 250.77495999999996, "r_x2": 469.78748, "r_y2": 242.02697999999998, "r_x3": 396.76776, "r_y3": 242.02697999999998, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.97653, "r_y0": 239.255, "r_x1": 324.79254, "r_y1": 239.255, "r_x2": 324.79254, "r_y2": 233.42296999999996, "r_x3": 320.97653, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.483, "r_y0": 239.255, "r_x1": 418.11319, "r_y1": 239.255, "r_x2": 418.11319, "r_y2": 233.42296999999996, "r_x3": 410.483, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.84949, "r_y0": 239.255, "r_x1": 508.47968000000003, "r_y1": 239.255, "r_x2": 508.47968000000003, "r_y2": 233.42296999999996, "r_x3": 500.84949, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.29999, "r_y0": 239.255, "r_x1": 372.93018, "r_y1": 239.255, "r_x2": 372.93018, "r_y2": 233.42296999999996, "r_x3": 365.29999, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.66626, "r_y0": 239.255, "r_x1": 463.29645, "r_y1": 239.255, "r_x2": 463.29645, "r_y2": 233.42296999999996, "r_x3": 455.66626, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.03528, "r_y0": 239.255, "r_x1": 549.66547, "r_y1": 239.255, "r_x2": 549.66547, "r_y2": 233.42296999999996, "r_x3": 542.03528, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04474, "r_y0": 236.27819999999997, "r_x1": 319.86075, "r_y1": 236.27819999999997, "r_x2": 319.86075, "r_y2": 230.44617000000005, "r_x3": 316.04474, "r_y3": 230.44617000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.62521, "r_y0": 204.52277000000004, "r_x1": 316.44122, "r_y1": 204.52277000000004, "r_x2": 316.44122, "r_y2": 198.69073000000003, "r_x3": 312.62521, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.43942, "r_y0": 204.52277000000004, "r_x1": 320.2554, "r_y1": 204.52277000000004, "r_x2": 320.2554, "r_y2": 198.69073000000003, "r_x3": 316.43942, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.14951, "r_y0": 173.92998999999998, "r_x1": 316.96552, "r_y1": 173.92998999999998, "r_x2": 316.96552, "r_y2": 168.09795999999994, "r_x3": 313.14951, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96371, "r_y0": 173.92998999999998, "r_x1": 320.77969, "r_y1": 173.92998999999998, "r_x2": 320.77969, "r_y2": 168.09795999999994, "r_x3": 316.96371, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.92972, "r_y0": 142.41974000000005, "r_x1": 316.74573, "r_y1": 142.41974000000005, "r_x2": 316.74573, "r_y2": 136.58771000000002, "r_x3": 312.92972, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74393, "r_y0": 142.41974000000005, "r_x1": 320.55991, "r_y1": 142.41974000000005, "r_x2": 320.55991, "r_y2": 136.58771000000002, "r_x3": 316.74393, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 111.43377999999996, "r_x1": 316.29828, "r_y1": 111.43377999999996, "r_x2": 316.29828, "r_y2": 105.60175000000004, "r_x3": 312.48227, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 111.43377999999996, "r_x1": 320.11246, "r_y1": 111.43377999999996, "r_x2": 320.11246, "r_y2": 105.60175000000004, "r_x3": 316.29648, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 218.09124999999995, "r_x1": 316.29828, "r_y1": 218.09124999999995, "r_x2": 316.29828, "r_y2": 212.25922000000003, "r_x3": 312.48227, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 218.09124999999995, "r_x1": 320.11246, "r_y1": 218.09124999999995, "r_x2": 320.11246, "r_y2": 212.25922000000003, "r_x3": 316.29648, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.07639, "r_y0": 189.55402000000004, "r_x1": 316.8924, "r_y1": 189.55402000000004, "r_x2": 316.8924, "r_y2": 183.72198000000003, "r_x3": 313.07639, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89059, "r_y0": 189.55402000000004, "r_x1": 320.70657, "r_y1": 189.55402000000004, "r_x2": 320.70657, "r_y2": 183.72198000000003, "r_x3": 316.89059, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76321, "r_y0": 158.30602999999996, "r_x1": 316.57922, "r_y1": 158.30602999999996, "r_x2": 316.57922, "r_y2": 152.47400000000005, "r_x3": 312.76321, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.57742, "r_y0": 158.30602999999996, "r_x1": 320.3934, "r_y1": 158.30602999999996, "r_x2": 320.3934, "r_y2": 152.47400000000005, "r_x3": 316.57742, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.19775, "r_y0": 126.40252999999996, "r_x1": 316.01376, "r_y1": 126.40252999999996, "r_x2": 316.01376, "r_y2": 120.57050000000004, "r_x3": 312.19775, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01196, "r_y0": 126.40252999999996, "r_x1": 319.82794, "r_y1": 126.40252999999996, "r_x2": 319.82794, "r_y2": 120.57050000000004, "r_x3": 316.01196, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8165, "r_y0": 95.94073000000003, "r_x1": 316.63251, "r_y1": 95.94073000000003, "r_x2": 316.63251, "r_y2": 90.1087, "r_x3": 312.8165, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63071, "r_y0": 95.94073000000003, "r_x1": 320.44669, "r_y1": 95.94073000000003, "r_x2": 320.44669, "r_y2": 90.1087, "r_x3": 316.63071, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17426, "r_y0": 230.01727000000005, "r_x1": 536.94427, "r_y1": 230.01727000000005, "r_x2": 536.94427, "r_y2": 222.72729000000004, "r_x3": 532.17426, "r_y3": 222.72729000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.87952, "r_y0": 115.55700999999999, "r_x1": 547.61249, "r_y1": 115.55700999999999, "r_x2": 547.61249, "r_y2": 108.26702999999986, "r_x3": 532.87952, "r_y3": 108.26702999999986, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.7735, "r_y0": 138.07097999999996, "r_x1": 542.73877, "r_y1": 138.07097999999996, "r_x2": 542.73877, "r_y2": 130.78101000000004, "r_x3": 532.7735, "r_y3": 130.78101000000004, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.79901, "r_y0": 161.21349999999995, "r_x1": 542.76428, "r_y1": 161.21349999999995, "r_x2": 542.76428, "r_y2": 153.92352000000005, "r_x3": 532.79901, "r_y3": 153.92352000000005, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.5705, "r_y0": 184.04796999999996, "r_x1": 542.53577, "r_y1": 184.04796999999996, "r_x2": 542.53577, "r_y2": 176.75800000000004, "r_x3": 532.5705, "r_y3": 176.75800000000004, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.14551, "r_y0": 206.93628, "r_x1": 542.11078, "r_y1": 206.93628, "r_x2": 542.11078, "r_y2": 199.6463, "r_x3": 532.14551, "r_y3": 199.6463, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 12, "label": "section_header", "bbox": { "l": 380.79849, "t": 79.81176999999991, "r": 486.84909, "b": 88.55975000000001, "coord_origin": "TOPLEFT" }, "confidence": 0.5687217116355896, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.79849, "r_y0": 88.55975000000001, "r_x1": 486.84909, "r_y1": 88.55975000000001, "r_x2": 486.84909, "r_y2": 79.81176999999991, "r_x3": 380.79849, "r_y3": 79.81176999999991, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 396.76776, "t": 242.02697999999998, "r": 469.78748, "b": 250.77495999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.76776, "r_y0": 250.77495999999996, "r_x1": 469.78748, "r_y1": 250.77495999999996, "r_x2": 469.78748, "r_y2": 242.02697999999998, "r_x3": 396.76776, "r_y3": 242.02697999999998, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 320.97653, "t": 233.42296999999996, "r": 324.79254, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.97653, "r_y0": 239.255, "r_x1": 324.79254, "r_y1": 239.255, "r_x2": 324.79254, "r_y2": 233.42296999999996, "r_x3": 320.97653, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 410.483, "t": 233.42296999999996, "r": 418.11319, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.483, "r_y0": 239.255, "r_x1": 418.11319, "r_y1": 239.255, "r_x2": 418.11319, "r_y2": 233.42296999999996, "r_x3": 410.483, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 500.84949, "t": 233.42296999999996, "r": 508.47968000000003, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.84949, "r_y0": 239.255, "r_x1": 508.47968000000003, "r_y1": 239.255, "r_x2": 508.47968000000003, "r_y2": 233.42296999999996, "r_x3": 500.84949, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 365.29999, "t": 233.42296999999996, "r": 372.93018, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.29999, "r_y0": 239.255, "r_x1": 372.93018, "r_y1": 239.255, "r_x2": 372.93018, "r_y2": 233.42296999999996, "r_x3": 365.29999, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 455.66626, "t": 233.42296999999996, "r": 463.29645, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.66626, "r_y0": 239.255, "r_x1": 463.29645, "r_y1": 239.255, "r_x2": 463.29645, "r_y2": 233.42296999999996, "r_x3": 455.66626, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 542.03528, "t": 233.42296999999996, "r": 549.66547, "b": 239.255, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.03528, "r_y0": 239.255, "r_x1": 549.66547, "r_y1": 239.255, "r_x2": 549.66547, "r_y2": 233.42296999999996, "r_x3": 542.03528, "r_y3": 233.42296999999996, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 316.04474, "t": 230.44617000000005, "r": 319.86075, "b": 236.27819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04474, "r_y0": 236.27819999999997, "r_x1": 319.86075, "r_y1": 236.27819999999997, "r_x2": 319.86075, "r_y2": 230.44617000000005, "r_x3": 316.04474, "r_y3": 230.44617000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 312.62521, "t": 198.69073000000003, "r": 316.44122, "b": 204.52277000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.62521, "r_y0": 204.52277000000004, "r_x1": 316.44122, "r_y1": 204.52277000000004, "r_x2": 316.44122, "r_y2": 198.69073000000003, "r_x3": 312.62521, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 316.43942, "t": 198.69073000000003, "r": 320.2554, "b": 204.52277000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.43942, "r_y0": 204.52277000000004, "r_x1": 320.2554, "r_y1": 204.52277000000004, "r_x2": 320.2554, "r_y2": 198.69073000000003, "r_x3": 316.43942, "r_y3": 198.69073000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 313.14951, "t": 168.09795999999994, "r": 316.96552, "b": 173.92998999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.14951, "r_y0": 173.92998999999998, "r_x1": 316.96552, "r_y1": 173.92998999999998, "r_x2": 316.96552, "r_y2": 168.09795999999994, "r_x3": 313.14951, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 316.96371, "t": 168.09795999999994, "r": 320.77969, "b": 173.92998999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96371, "r_y0": 173.92998999999998, "r_x1": 320.77969, "r_y1": 173.92998999999998, "r_x2": 320.77969, "r_y2": 168.09795999999994, "r_x3": 316.96371, "r_y3": 168.09795999999994, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 312.92972, "t": 136.58771000000002, "r": 316.74573, "b": 142.41974000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.92972, "r_y0": 142.41974000000005, "r_x1": 316.74573, "r_y1": 142.41974000000005, "r_x2": 316.74573, "r_y2": 136.58771000000002, "r_x3": 312.92972, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 316.74393, "t": 136.58771000000002, "r": 320.55991, "b": 142.41974000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74393, "r_y0": 142.41974000000005, "r_x1": 320.55991, "r_y1": 142.41974000000005, "r_x2": 320.55991, "r_y2": 136.58771000000002, "r_x3": 316.74393, "r_y3": 136.58771000000002, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 312.48227, "t": 105.60175000000004, "r": 316.29828, "b": 111.43377999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 111.43377999999996, "r_x1": 316.29828, "r_y1": 111.43377999999996, "r_x2": 316.29828, "r_y2": 105.60175000000004, "r_x3": 312.48227, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 316.29648, "t": 105.60175000000004, "r": 320.11246, "b": 111.43377999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 111.43377999999996, "r_x1": 320.11246, "r_y1": 111.43377999999996, "r_x2": 320.11246, "r_y2": 105.60175000000004, "r_x3": 316.29648, "r_y3": 105.60175000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 312.48227, "t": 212.25922000000003, "r": 316.29828, "b": 218.09124999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48227, "r_y0": 218.09124999999995, "r_x1": 316.29828, "r_y1": 218.09124999999995, "r_x2": 316.29828, "r_y2": 212.25922000000003, "r_x3": 312.48227, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 316.29648, "t": 212.25922000000003, "r": 320.11246, "b": 218.09124999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.29648, "r_y0": 218.09124999999995, "r_x1": 320.11246, "r_y1": 218.09124999999995, "r_x2": 320.11246, "r_y2": 212.25922000000003, "r_x3": 316.29648, "r_y3": 212.25922000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 313.07639, "t": 183.72198000000003, "r": 316.8924, "b": 189.55402000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.07639, "r_y0": 189.55402000000004, "r_x1": 316.8924, "r_y1": 189.55402000000004, "r_x2": 316.8924, "r_y2": 183.72198000000003, "r_x3": 313.07639, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 316.89059, "t": 183.72198000000003, "r": 320.70657, "b": 189.55402000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89059, "r_y0": 189.55402000000004, "r_x1": 320.70657, "r_y1": 189.55402000000004, "r_x2": 320.70657, "r_y2": 183.72198000000003, "r_x3": 316.89059, "r_y3": 183.72198000000003, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 312.76321, "t": 152.47400000000005, "r": 316.57922, "b": 158.30602999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76321, "r_y0": 158.30602999999996, "r_x1": 316.57922, "r_y1": 158.30602999999996, "r_x2": 316.57922, "r_y2": 152.47400000000005, "r_x3": 312.76321, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 316.57742, "t": 152.47400000000005, "r": 320.3934, "b": 158.30602999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.57742, "r_y0": 158.30602999999996, "r_x1": 320.3934, "r_y1": 158.30602999999996, "r_x2": 320.3934, "r_y2": 152.47400000000005, "r_x3": 316.57742, "r_y3": 152.47400000000005, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 312.19775, "t": 120.57050000000004, "r": 316.01376, "b": 126.40252999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.19775, "r_y0": 126.40252999999996, "r_x1": 316.01376, "r_y1": 126.40252999999996, "r_x2": 316.01376, "r_y2": 120.57050000000004, "r_x3": 312.19775, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 316.01196, "t": 120.57050000000004, "r": 319.82794, "b": 126.40252999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01196, "r_y0": 126.40252999999996, "r_x1": 319.82794, "r_y1": 126.40252999999996, "r_x2": 319.82794, "r_y2": 120.57050000000004, "r_x3": 316.01196, "r_y3": 120.57050000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 312.8165, "t": 90.1087, "r": 316.63251, "b": 95.94073000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8165, "r_y0": 95.94073000000003, "r_x1": 316.63251, "r_y1": 95.94073000000003, "r_x2": 316.63251, "r_y2": 90.1087, "r_x3": 312.8165, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 316.63071, "t": 90.1087, "r": 320.44669, "b": 95.94073000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63071, "r_y0": 95.94073000000003, "r_x1": 320.44669, "r_y1": 95.94073000000003, "r_x2": 320.44669, "r_y2": 90.1087, "r_x3": 316.63071, "r_y3": 90.1087, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 532.17426, "t": 222.72729000000004, "r": 536.94427, "b": 230.01727000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17426, "r_y0": 230.01727000000005, "r_x1": 536.94427, "r_y1": 230.01727000000005, "r_x2": 536.94427, "r_y2": 222.72729000000004, "r_x3": 532.17426, "r_y3": 222.72729000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 532.87952, "t": 108.26702999999986, "r": 547.61249, "b": 115.55700999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.87952, "r_y0": 115.55700999999999, "r_x1": 547.61249, "r_y1": 115.55700999999999, "r_x2": 547.61249, "r_y2": 108.26702999999986, "r_x3": 532.87952, "r_y3": 108.26702999999986, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 532.7735, "t": 130.78101000000004, "r": 542.73877, "b": 138.07097999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.7735, "r_y0": 138.07097999999996, "r_x1": 542.73877, "r_y1": 138.07097999999996, "r_x2": 542.73877, "r_y2": 130.78101000000004, "r_x3": 532.7735, "r_y3": 130.78101000000004, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 532.79901, "t": 153.92352000000005, "r": 542.76428, "b": 161.21349999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.79901, "r_y0": 161.21349999999995, "r_x1": 542.76428, "r_y1": 161.21349999999995, "r_x2": 542.76428, "r_y2": 153.92352000000005, "r_x3": 532.79901, "r_y3": 153.92352000000005, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 532.5705, "t": 176.75800000000004, "r": 542.53577, "b": 184.04796999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.5705, "r_y0": 184.04796999999996, "r_x1": 542.53577, "r_y1": 184.04796999999996, "r_x2": 542.53577, "r_y2": 176.75800000000004, "r_x3": 532.5705, "r_y3": 176.75800000000004, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 532.14551, "t": 199.6463, "r": 542.11078, "b": 206.93628, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.14551, "r_y0": 206.93628, "r_x1": 542.11078, "r_y1": 206.93628, "r_x2": 542.11078, "r_y2": 199.6463, "r_x3": 532.14551, "r_y3": 199.6463, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 7, "page_no": 2, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 308.862, "t": 267.83636, "r": 545.11511, "b": 288.6979099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9667505025863647, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 276.74292, "r_x1": 346.06238, "r_y1": 276.74292, "r_x2": 346.06238, "r_y2": 267.83636, "r_x3": 308.862, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49072, "r_y0": 276.74292, "r_x1": 545.11511, "r_y1": 276.74292, "r_x2": 545.11511, "r_y2": 267.83636, "r_x3": 354.49072, "r_y3": 267.83636, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 288.6979099999999, "r_x1": 498.56989, "r_y1": 288.6979099999999, "r_x2": 498.56989, "r_y2": 279.79132000000004, "r_x3": 308.862, "r_y3": 279.79132000000004, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets" }, { "label": "text", "id": 9, "page_no": 2, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.862, "t": 317.47336, "r": 437.27002, "b": 326.37991, "coord_origin": "TOPLEFT" }, "confidence": 0.8879811763763428, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 326.37991, "r_x1": 437.27002, "r_y1": 326.37991, "r_x2": 437.27002, "r_y2": 317.47336, "r_x3": 308.862, "r_y3": 317.47336, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "balance in the previous datasets." }, { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.862, "t": 331.53137, "r": 545.11517, "b": 627.36174, "coord_origin": "TOPLEFT" }, "confidence": 0.9870319366455078, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 340.43793, "r_x1": 545.11505, "r_y1": 340.43793, "r_x2": 545.11505, "r_y2": 331.53137, "r_x3": 320.81699, "r_y3": 331.53137, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 352.39291, "r_x1": 545.11517, "r_y1": 352.39291, "r_x2": 545.11517, "r_y2": 343.48635999999993, "r_x3": 308.862, "r_y3": 343.48635999999993, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 364.34890999999993, "r_x1": 545.11505, "r_y1": 364.34890999999993, "r_x2": 545.11505, "r_y2": 355.44235, "r_x3": 308.862, "r_y3": 355.44235, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 376.30389, "r_x1": 545.11505, "r_y1": 376.30389, "r_x2": 545.11505, "r_y2": 367.39734, "r_x3": 308.862, "r_y3": 367.39734, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 388.25888, "r_x1": 545.11511, "r_y1": 388.25888, "r_x2": 545.11511, "r_y2": 379.35233, "r_x3": 308.862, "r_y3": 379.35233, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.21386999999993, "r_x1": 545.11511, "r_y1": 400.21386999999993, "r_x2": 545.11511, "r_y2": 391.30731, "r_x3": 308.862, "r_y3": 391.30731, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.16885, "r_x1": 545.11505, "r_y1": 412.16885, "r_x2": 545.11505, "r_y2": 403.26230000000004, "r_x3": 308.862, "r_y3": 403.26230000000004, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.12384, "r_x1": 545.11511, "r_y1": 424.12384, "r_x2": 545.11511, "r_y2": 415.21729, "r_x3": 308.862, "r_y3": 415.21729, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.0798300000001, "r_x1": 545.11517, "r_y1": 436.0798300000001, "r_x2": 545.11517, "r_y2": 427.17328, "r_x3": 308.862, "r_y3": 427.17328, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.03482, "r_x1": 545.11517, "r_y1": 448.03482, "r_x2": 545.11517, "r_y2": 439.12827, "r_x3": 308.862, "r_y3": 439.12827, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 459.98981000000003, "r_x1": 545.11511, "r_y1": 459.98981000000003, "r_x2": 545.11511, "r_y2": 451.08325, "r_x3": 308.862, "r_y3": 451.08325, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 471.94479, "r_x1": 545.11505, "r_y1": 471.94479, "r_x2": 545.11505, "r_y2": 463.03824, "r_x3": 308.862, "r_y3": 463.03824, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 483.89978, "r_x1": 545.11511, "r_y1": 483.89978, "r_x2": 545.11511, "r_y2": 474.99323, "r_x3": 308.862, "r_y3": 474.99323, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 495.85577, "r_x1": 545.11511, "r_y1": 495.85577, "r_x2": 545.11511, "r_y2": 486.94922, "r_x3": 308.862, "r_y3": 486.94922, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 507.81076, "r_x1": 545.11511, "r_y1": 507.81076, "r_x2": 545.11511, "r_y2": 498.90421, "r_x3": 308.862, "r_y3": 498.90421, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 519.76575, "r_x1": 545.11517, "r_y1": 519.76575, "r_x2": 545.11517, "r_y2": 510.85919, "r_x3": 308.862, "r_y3": 510.85919, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 531.72073, "r_x1": 545.11517, "r_y1": 531.72073, "r_x2": 545.11517, "r_y2": 522.8141800000001, "r_x3": 308.862, "r_y3": 522.8141800000001, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 543.67574, "r_x1": 545.11505, "r_y1": 543.67574, "r_x2": 545.11505, "r_y2": 534.76917, "r_x3": 308.862, "r_y3": 534.76917, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 555.6307400000001, "r_x1": 545.11511, "r_y1": 555.6307400000001, "r_x2": 545.11511, "r_y2": 546.72418, "r_x3": 308.862, "r_y3": 546.72418, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 567.58673, "r_x1": 545.11511, "r_y1": 567.58673, "r_x2": 545.11511, "r_y2": 558.6801800000001, "r_x3": 308.862, "r_y3": 558.6801800000001, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 579.54173, "r_x1": 545.11505, "r_y1": 579.54173, "r_x2": 545.11505, "r_y2": 570.63518, "r_x3": 308.862, "r_y3": 570.63518, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 591.49673, "r_x1": 545.11499, "r_y1": 591.49673, "r_x2": 545.11499, "r_y2": 582.59018, "r_x3": 308.862, "r_y3": 582.59018, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 603.45174, "r_x1": 545.11517, "r_y1": 603.45174, "r_x2": 545.11517, "r_y2": 594.54518, "r_x3": 308.862, "r_y3": 594.54518, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 615.40674, "r_x1": 545.11511, "r_y1": 615.40674, "r_x2": 545.11511, "r_y2": 606.50018, "r_x3": 308.862, "r_y3": 606.50018, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 627.36174, "r_x1": 348.16446, "r_y1": 627.36174, "r_x2": 348.16446, "r_y2": 618.45518, "r_x3": 308.862, "r_y3": 618.45518, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits." }, { "label": "text", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.862, "t": 632.51419, "r": 545.11511, "b": 713.151764, "coord_origin": "TOPLEFT" }, "confidence": 0.9840091466903687, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 641.42075, "r_x1": 545.11487, "r_y1": 641.42075, "r_x2": 545.11487, "r_y2": 632.51419, "r_x3": 320.81699, "r_y3": 632.51419, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.37575, "r_x1": 545.11511, "r_y1": 653.37575, "r_x2": 545.11511, "r_y2": 644.46919, "r_x3": 308.862, "r_y3": 644.46919, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.33076, "r_x1": 545.11511, "r_y1": 665.33076, "r_x2": 545.11511, "r_y2": 656.42419, "r_x3": 308.862, "r_y3": 656.42419, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.28676, "r_x1": 545.11499, "r_y1": 677.28676, "r_x2": 545.11499, "r_y2": 668.38019, "r_x3": 308.862, "r_y3": 668.38019, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.24176, "r_x1": 545.11505, "r_y1": 689.24176, "r_x2": 545.11505, "r_y2": 680.33519, "r_x3": 308.862, "r_y3": 680.33519, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 701.196762, "r_x1": 545.11505, "r_y1": 701.196762, "r_x2": 545.11505, "r_y2": 692.290192, "r_x3": 308.862, "r_y3": 692.290192, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 713.151764, "r_x1": 545.11511, "r_y1": 713.151764, "r_x2": 545.11511, "r_y2": 704.245193, "r_x3": 308.862, "r_y3": 704.245193, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small" } ], "headers": [ { "label": "page_footer", "id": 11, "page_no": 2, "cluster": { "id": 11, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133198, "r": 300.10229, "b": 743.039761, "coord_origin": "TOPLEFT" }, "confidence": 0.8715606927871704, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039761, "r_x1": 300.10229, "r_y1": 743.039761, "r_x2": 300.10229, "r_y2": 734.133198, "r_x3": 295.121, "r_y3": 734.133198, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" } ] } }, { "page_no": 3, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36511, "r_y1": 84.11492999999996, "r_x2": 286.36511, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 212.28319, "r_y1": 96.06994999999995, "r_x2": 212.28319, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 109.86694, "r_x1": 286.36502, "r_y1": 109.86694, "r_x2": 286.36502, "r_y2": 100.96038999999996, "r_x3": 62.067001, "r_y3": 100.96038999999996, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 121.82195999999999, "r_x1": 286.36508, "r_y1": 121.82195999999999, "r_x2": 286.36508, "r_y2": 112.91540999999995, "r_x3": 50.112, "r_y3": 112.91540999999995, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 133.77697999999998, "r_x1": 286.36508, "r_y1": 133.77697999999998, "r_x2": 286.36508, "r_y2": 124.87041999999997, "r_x3": 50.112, "r_y3": 124.87041999999997, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 145.73297000000002, "r_x1": 286.36511, "r_y1": 145.73297000000002, "r_x2": 286.36511, "r_y2": 136.82641999999998, "r_x3": 50.112, "r_y3": 136.82641999999998, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 157.68799, "r_x1": 286.36511, "r_y1": 157.68799, "r_x2": 286.36511, "r_y2": 148.78143, "r_x3": 50.112, "r_y3": 148.78143, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 169.64301, "r_x1": 286.36508, "r_y1": 169.64301, "r_x2": 286.36508, "r_y2": 160.73645, "r_x3": 50.112, "r_y3": 160.73645, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 181.59802000000002, "r_x1": 286.36505, "r_y1": 181.59802000000002, "r_x2": 286.36505, "r_y2": 172.69146999999998, "r_x3": 50.112, "r_y3": 172.69146999999998, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 193.55304, "r_x1": 286.36508, "r_y1": 193.55304, "r_x2": 286.36508, "r_y2": 184.64648, "r_x3": 50.112, "r_y3": 184.64648, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 205.50903000000005, "r_x1": 286.36508, "r_y1": 205.50903000000005, "r_x2": 286.36508, "r_y2": 196.60248, "r_x3": 50.112, "r_y3": 196.60248, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 217.46405000000004, "r_x1": 286.36508, "r_y1": 217.46405000000004, "r_x2": 286.36508, "r_y2": 208.5575, "r_x3": 50.112, "r_y3": 208.5575, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 229.41907000000003, "r_x1": 286.36511, "r_y1": 229.41907000000003, "r_x2": 286.36511, "r_y2": 220.51251000000002, "r_x3": 50.112, "r_y3": 220.51251000000002, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 241.37408000000005, "r_x1": 286.36508, "r_y1": 241.37408000000005, "r_x2": 286.36508, "r_y2": 232.46753, "r_x3": 50.112, "r_y3": 232.46753, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 253.32910000000004, "r_x1": 286.36508, "r_y1": 253.32910000000004, "r_x2": 286.36508, "r_y2": 244.42255, "r_x3": 50.112, "r_y3": 244.42255, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 265.28412000000003, "r_x1": 286.36505, "r_y1": 265.28412000000003, "r_x2": 286.36505, "r_y2": 256.37756, "r_x3": 50.112, "r_y3": 256.37756, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 277.24010999999996, "r_x1": 286.36505, "r_y1": 277.24010999999996, "r_x2": 286.36505, "r_y2": 268.33356000000003, "r_x3": 50.112, "r_y3": 268.33356000000003, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 289.1951, "r_x1": 68.652397, "r_y1": 289.1951, "r_x2": 68.652397, "r_y2": 280.28853999999995, "r_x3": 50.112, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.566444, "r_y0": 289.1951, "r_x1": 286.36514, "r_y1": 289.1951, "r_x2": 286.36514, "r_y2": 280.28853999999995, "r_x3": 75.566444, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 301.15009, "r_x1": 286.36511, "r_y1": 301.15009, "r_x2": 286.36511, "r_y2": 292.24353, "r_x3": 50.112, "r_y3": 292.24353, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 313.10507, "r_x1": 75.695961, "r_y1": 313.10507, "r_x2": 75.695961, "r_y2": 304.19852000000003, "r_x3": 50.112, "r_y3": 304.19852000000003, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 326.90207, "r_x1": 286.36499, "r_y1": 326.90207, "r_x2": 286.36499, "r_y2": 317.99550999999997, "r_x3": 62.067001, "r_y3": 317.99550999999997, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 338.8580600000001, "r_x1": 286.36511, "r_y1": 338.8580600000001, "r_x2": 286.36511, "r_y2": 329.95151, "r_x3": 50.112, "r_y3": 329.95151, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 350.81305, "r_x1": 286.36502, "r_y1": 350.81305, "r_x2": 286.36502, "r_y2": 341.90649, "r_x3": 50.112, "r_y3": 341.90649, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 362.76804, "r_x1": 286.36505, "r_y1": 362.76804, "r_x2": 286.36505, "r_y2": 353.8614799999999, "r_x3": 50.112, "r_y3": 353.8614799999999, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 374.72301999999996, "r_x1": 286.36508, "r_y1": 374.72301999999996, "r_x2": 286.36508, "r_y2": 365.81647, "r_x3": 50.112, "r_y3": 365.81647, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 386.67801, "r_x1": 141.58859, "r_y1": 386.67801, "r_x2": 141.58859, "r_y2": 377.77145, "r_x3": 50.112, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.70189, "r_y0": 386.67801, "r_x1": 286.36508, "r_y1": 386.67801, "r_x2": 286.36508, "r_y2": 377.77145, "r_x3": 148.70189, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 398.63300000000004, "r_x1": 286.36508, "r_y1": 398.63300000000004, "r_x2": 286.36508, "r_y2": 389.72644, "r_x3": 50.112, "r_y3": 389.72644, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 410.58899, "r_x1": 286.36511, "r_y1": 410.58899, "r_x2": 286.36511, "r_y2": 401.68243, "r_x3": 50.112, "r_y3": 401.68243, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 422.54398, "r_x1": 286.36511, "r_y1": 422.54398, "r_x2": 286.36511, "r_y2": 413.63742, "r_x3": 50.112, "r_y3": 413.63742, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 434.49896, "r_x1": 216.39774, "r_y1": 434.49896, "r_x2": 216.39774, "r_y2": 425.59241, "r_x3": 50.112, "r_y3": 425.59241, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 448.2959599999999, "r_x1": 286.36499, "r_y1": 448.2959599999999, "r_x2": 286.36499, "r_y2": 439.3894, "r_x3": 62.067001, "r_y3": 439.3894, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 460.25095, "r_x1": 172.14388, "r_y1": 460.25095, "r_x2": 172.14388, "r_y2": 451.34439, "r_x3": 50.112, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.14801, "r_y0": 460.02182, "r_x1": 224.70818999999997, "r_y1": 460.02182, "r_x2": 224.70818999999997, "r_y2": 451.43405, "r_x3": 174.14801, "r_y3": 451.43405, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.70801, "r_y0": 460.25095, "r_x1": 286.36655, "r_y1": 460.25095, "r_x2": 286.36655, "r_y2": 451.34439, "r_x3": 224.70801, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 472.20694, "r_x1": 286.36505, "r_y1": 472.20694, "r_x2": 286.36505, "r_y2": 463.30038, "r_x3": 50.112015, "r_y3": 463.30038, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 484.16193, "r_x1": 286.36511, "r_y1": 484.16193, "r_x2": 286.36511, "r_y2": 475.25537, "r_x3": 50.112015, "r_y3": 475.25537, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 496.11691, "r_x1": 286.36511, "r_y1": 496.11691, "r_x2": 286.36511, "r_y2": 487.21036, "r_x3": 50.112015, "r_y3": 487.21036, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 508.0719, "r_x1": 286.36508, "r_y1": 508.0719, "r_x2": 286.36508, "r_y2": 499.16534, "r_x3": 50.112015, "r_y3": 499.16534, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 520.02689, "r_x1": 286.36505, "r_y1": 520.02689, "r_x2": 286.36505, "r_y2": 511.12033, "r_x3": 50.112015, "r_y3": 511.12033, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 531.98288, "r_x1": 286.36508, "r_y1": 531.98288, "r_x2": 286.36508, "r_y2": 523.07632, "r_x3": 50.112015, "r_y3": 523.07632, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 543.93788, "r_x1": 286.36508, "r_y1": 543.93788, "r_x2": 286.36508, "r_y2": 535.0313100000001, "r_x3": 50.112015, "r_y3": 535.0313100000001, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 555.89288, "r_x1": 286.36511, "r_y1": 555.89288, "r_x2": 286.36511, "r_y2": 546.98633, "r_x3": 50.112015, "r_y3": 546.98633, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 567.84789, "r_x1": 286.36508, "r_y1": 567.84789, "r_x2": 286.36508, "r_y2": 558.94133, "r_x3": 50.112015, "r_y3": 558.94133, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 579.8028899999999, "r_x1": 286.36511, "r_y1": 579.8028899999999, "r_x2": 286.36511, "r_y2": 570.89633, "r_x3": 50.112015, "r_y3": 570.89633, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 591.75789, "r_x1": 286.36511, "r_y1": 591.75789, "r_x2": 286.36511, "r_y2": 582.85133, "r_x3": 50.112015, "r_y3": 582.85133, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 603.71388, "r_x1": 286.36505, "r_y1": 603.71388, "r_x2": 286.36505, "r_y2": 594.80733, "r_x3": 50.112015, "r_y3": 594.80733, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 615.6688800000001, "r_x1": 286.36508, "r_y1": 615.6688800000001, "r_x2": 286.36508, "r_y2": 606.76233, "r_x3": 50.112015, "r_y3": 606.76233, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 627.62389, "r_x1": 209.7527, "r_y1": 627.62389, "r_x2": 209.7527, "r_y2": 618.71733, "r_x3": 50.112015, "r_y3": 618.71733, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067017, "r_y0": 641.42088, "r_x1": 286.36499, "r_y1": 641.42088, "r_x2": 286.36499, "r_y2": 632.51433, "r_x3": 62.067017, "r_y3": 632.51433, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 653.37589, "r_x1": 286.36508, "r_y1": 653.37589, "r_x2": 286.36508, "r_y2": 644.46933, "r_x3": 50.112015, "r_y3": 644.46933, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.33189, "r_x1": 286.36511, "r_y1": 665.33189, "r_x2": 286.36511, "r_y2": 656.42532, "r_x3": 50.112015, "r_y3": 656.42532, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28689, "r_x1": 286.36505, "r_y1": 677.28689, "r_x2": 286.36505, "r_y2": 668.38033, "r_x3": 50.112015, "r_y3": 668.38033, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24189, "r_x1": 286.36508, "r_y1": 689.24189, "r_x2": 286.36508, "r_y2": 680.33533, "r_x3": 50.112015, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.196892, "r_x1": 286.36508, "r_y1": 701.196892, "r_x2": 286.36508, "r_y2": 692.290329, "r_x3": 50.112015, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151894, "r_x1": 286.36511, "r_y1": 713.151894, "r_x2": 286.36511, "r_y2": 704.245331, "r_x3": 50.112015, "r_y3": 704.245331, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 176.56793000000005, "r_x1": 344.6178, "r_y1": 176.56793000000005, "r_x2": 344.6178, "r_y2": 167.66138, "r_x3": 308.862, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.07602, "r_y0": 176.56793000000005, "r_x1": 380.45328, "r_y1": 176.56793000000005, "r_x2": 380.45328, "r_y2": 167.66138, "r_x3": 361.07602, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.56799, "r_y0": 176.33880999999997, "r_x1": 468.67974999999996, "r_y1": 176.33880999999997, "r_x2": 468.67974999999996, "r_y2": 167.75104, "r_x3": 386.56799, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.79599, "r_y0": 176.56793000000005, "r_x1": 489.18198, "r_y1": 176.56793000000005, "r_x2": 489.18198, "r_y2": 167.66138, "r_x3": 474.79599, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.29898000000003, "r_y0": 176.33880999999997, "r_x1": 545.112, "r_y1": 176.33880999999997, "r_x2": 545.112, "r_y2": 167.75104, "r_x3": 495.29898000000003, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 188.29381999999998, "r_x1": 341.16077, "r_y1": 188.29381999999998, "r_x2": 341.16077, "r_y2": 179.70605, "r_x3": 308.862, "r_y3": 179.70605, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.457, "r_y0": 188.52295000000004, "r_x1": 545.11005, "r_y1": 188.52295000000004, "r_x2": 545.11005, "r_y2": 179.61639000000002, "r_x3": 343.457, "r_y3": 179.61639000000002, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 200.47797000000003, "r_x1": 545.11505, "r_y1": 200.47797000000003, "r_x2": 545.11505, "r_y2": 191.57141000000001, "r_x3": 308.862, "r_y3": 191.57141000000001, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 212.43298000000004, "r_x1": 545.11499, "r_y1": 212.43298000000004, "r_x2": 545.11499, "r_y2": 203.52643, "r_x3": 308.862, "r_y3": 203.52643, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 224.38897999999995, "r_x1": 523.93469, "r_y1": 224.38897999999995, "r_x2": 523.93469, "r_y2": 215.48242000000005, "r_x3": 308.862, "r_y3": 215.48242000000005, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.52698, "r_x1": 545.11517, "r_y1": 258.52698, "r_x2": 545.11517, "r_y2": 249.62041999999997, "r_x3": 308.862, "r_y3": 249.62041999999997, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.48199, "r_x1": 545.11517, "r_y1": 270.48199, "r_x2": 545.11517, "r_y2": 261.57543999999996, "r_x3": 308.862, "r_y3": 261.57543999999996, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.43698, "r_x1": 545.11505, "r_y1": 282.43698, "r_x2": 545.11505, "r_y2": 273.5304, "r_x3": 308.862, "r_y3": 273.5304, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.39197, "r_x1": 436.82169, "r_y1": 294.39197, "r_x2": 436.82169, "r_y2": 285.48541000000006, "r_x3": 308.862, "r_y3": 285.48541000000006, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 306.67896, "r_x1": 542.74396, "r_y1": 306.67896, "r_x2": 542.74396, "r_y2": 297.77240000000006, "r_x3": 320.81699, "r_y3": 297.77240000000006, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 331.93167000000005, "r_x1": 316.28476, "r_y1": 331.93167000000005, "r_x2": 316.28476, "r_y2": 321.18396, "r_x3": 308.862, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18176, "r_y0": 331.93167000000005, "r_x1": 444.93607000000003, "r_y1": 331.93167000000005, "r_x2": 444.93607000000003, "r_y2": 321.18396, "r_x3": 326.18176, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 350.84594999999996, "r_x1": 545.11499, "r_y1": 350.84594999999996, "r_x2": 545.11499, "r_y2": 341.93939, "r_x3": 320.81699, "r_y3": 341.93939, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 362.80092999999994, "r_x1": 545.11511, "r_y1": 362.80092999999994, "r_x2": 545.11511, "r_y2": 353.89438, "r_x3": 308.862, "r_y3": 353.89438, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 374.75592, "r_x1": 545.11517, "r_y1": 374.75592, "r_x2": 545.11517, "r_y2": 365.84937, "r_x3": 308.862, "r_y3": 365.84937, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 386.71091, "r_x1": 545.11505, "r_y1": 386.71091, "r_x2": 545.11505, "r_y2": 377.80435, "r_x3": 308.862, "r_y3": 377.80435, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 398.66588999999993, "r_x1": 545.11517, "r_y1": 398.66588999999993, "r_x2": 545.11517, "r_y2": 389.75934000000007, "r_x3": 308.862, "r_y3": 389.75934000000007, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 410.62088, "r_x1": 545.11523, "r_y1": 410.62088, "r_x2": 545.11523, "r_y2": 401.71432000000004, "r_x3": 308.862, "r_y3": 401.71432000000004, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 422.57687, "r_x1": 545.11517, "r_y1": 422.57687, "r_x2": 545.11517, "r_y2": 413.67032, "r_x3": 308.862, "r_y3": 413.67032, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 434.53186, "r_x1": 545.11505, "r_y1": 434.53186, "r_x2": 545.11505, "r_y2": 425.62531, "r_x3": 308.862, "r_y3": 425.62531, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 446.48685000000006, "r_x1": 437.9375, "r_y1": 446.48685000000006, "r_x2": 437.9375, "r_y2": 437.58029, "r_x3": 308.862, "r_y3": 437.58029, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 467.54633, "r_x1": 323.14081, "r_y1": 467.54633, "r_x2": 323.14081, "r_y2": 457.69427, "r_x3": 308.862, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66003, "r_y0": 467.54633, "r_x1": 420.16058, "r_y1": 467.54633, "r_x2": 420.16058, "r_y2": 457.69427, "r_x3": 332.66003, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 485.67184, "r_x1": 545.11487, "r_y1": 485.67184, "r_x2": 545.11487, "r_y2": 476.76529, "r_x3": 320.81699, "r_y3": 476.76529, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.62683, "r_x1": 509.02054, "r_y1": 497.62683, "r_x2": 509.02054, "r_y2": 488.72028, "r_x3": 308.862, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.58588, "r_y0": 497.62683, "r_x1": 523.05786, "r_y1": 497.62683, "r_x2": 523.05786, "r_y2": 488.72028, "r_x3": 515.58588, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 497.62683, "r_x1": 545.11505, "r_y1": 497.62683, "r_x2": 545.11505, "r_y2": 488.72028, "r_x3": 529.62323, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 509.35269, "r_x1": 406.34601, "r_y1": 509.35269, "r_x2": 406.34601, "r_y2": 500.76492, "r_x3": 308.862, "r_y3": 500.76492, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87201, "r_y0": 509.58182, "r_x1": 545.1106, "r_y1": 509.58182, "r_x2": 545.1106, "r_y2": 500.67526, "r_x3": 408.87201, "r_y3": 500.67526, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 521.53781, "r_x1": 409.39459, "r_y1": 521.53781, "r_x2": 409.39459, "r_y2": 512.63126, "r_x3": 308.862, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.72705, "r_y0": 521.53781, "r_x1": 545.11505, "r_y1": 521.53781, "r_x2": 545.11505, "r_y2": 512.63126, "r_x3": 416.72705, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.4928, "r_x1": 436.194, "r_y1": 533.4928, "r_x2": 436.194, "r_y2": 524.58624, "r_x3": 308.862, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.526, "r_y0": 533.26367, "r_x1": 513.86694, "r_y1": 533.26367, "r_x2": 513.86694, "r_y2": 524.6759, "r_x3": 439.526, "r_y3": 524.6759, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43201, "r_y0": 533.4928, "r_x1": 545.10815, "r_y1": 533.4928, "r_x2": 545.10815, "r_y2": 524.58624, "r_x3": 517.43201, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.4478, "r_x1": 545.11511, "r_y1": 545.4478, "r_x2": 545.11511, "r_y2": 536.54124, "r_x3": 308.862, "r_y3": 536.54124, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.4028000000001, "r_x1": 358.5455, "r_y1": 557.4028000000001, "r_x2": 358.5455, "r_y2": 548.49625, "r_x3": 308.862, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19055, "r_y0": 557.4028000000001, "r_x1": 545.11517, "r_y1": 557.4028000000001, "r_x2": 545.11517, "r_y2": 548.49625, "r_x3": 365.19055, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.3578, "r_x1": 352.40851, "r_y1": 569.3578, "r_x2": 352.40851, "r_y2": 560.45125, "r_x3": 308.862, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.409, "r_y0": 569.13863, "r_x1": 360.1579, "r_y1": 569.13863, "r_x2": 360.1579, "r_y2": 560.29184, "r_x3": 352.409, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.15799, "r_y0": 569.3578, "r_x1": 367.90891, "r_y1": 569.3578, "r_x2": 367.90891, "r_y2": 560.45125, "r_x3": 360.15799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.909, "r_y0": 569.13863, "r_x1": 375.6579, "r_y1": 569.13863, "r_x2": 375.6579, "r_y2": 560.29184, "r_x3": 367.909, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.65799, "r_y0": 569.3578, "r_x1": 545.11182, "r_y1": 569.3578, "r_x2": 545.11182, "r_y2": 560.45125, "r_x3": 375.65799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.3138, "r_x1": 545.11499, "r_y1": 581.3138, "r_x2": 545.11499, "r_y2": 572.40724, "r_x3": 308.862, "r_y3": 572.40724, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.2688, "r_x1": 483.11768, "r_y1": 593.2688, "r_x2": 483.11768, "r_y2": 584.3622399999999, "r_x3": 308.862, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 593.04962, "r_x1": 490.86792, "r_y1": 593.04962, "r_x2": 490.86792, "r_y2": 584.20284, "r_x3": 483.11902, "r_y3": 584.20284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.86800999999997, "r_y0": 593.2688, "r_x1": 545.11438, "r_y1": 593.2688, "r_x2": 545.11438, "r_y2": 584.3622399999999, "r_x3": 490.86800999999997, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2238, "r_x1": 545.11493, "r_y1": 605.2238, "r_x2": 545.11493, "r_y2": 596.31725, "r_x3": 308.862, "r_y3": 596.31725, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.1788, "r_x1": 329.64395, "r_y1": 617.1788, "r_x2": 329.64395, "r_y2": 608.27225, "r_x3": 308.862, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.646, "r_y0": 616.9596300000001, "r_x1": 337.3949, "r_y1": 616.9596300000001, "r_x2": 337.3949, "r_y2": 608.11284, "r_x3": 329.646, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39398, "r_y0": 617.1788, "r_x1": 468.5914, "r_y1": 617.1788, "r_x2": 468.5914, "r_y2": 608.27225, "r_x3": 337.39398, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59496999999993, "r_y0": 616.9596300000001, "r_x1": 476.34387000000004, "r_y1": 616.9596300000001, "r_x2": 476.34387000000004, "r_y2": 608.11284, "r_x3": 468.59496999999993, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.3439599999999, "r_y0": 617.1788, "r_x1": 545.11572, "r_y1": 617.1788, "r_x2": 545.11572, "r_y2": 608.27225, "r_x3": 476.3439599999999, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.1338000000001, "r_x1": 545.11499, "r_y1": 629.1338000000001, "r_x2": 545.11499, "r_y2": 620.22725, "r_x3": 308.86197, "r_y3": 620.22725, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.08881, "r_x1": 545.11517, "r_y1": 641.08881, "r_x2": 545.11517, "r_y2": 632.1822500000001, "r_x3": 308.86197, "r_y3": 632.1822500000001, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.0448, "r_x1": 545.11511, "r_y1": 653.0448, "r_x2": 545.11511, "r_y2": 644.13824, "r_x3": 308.86197, "r_y3": 644.13824, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 664.99981, "r_x1": 449.42432, "r_y1": 664.99981, "r_x2": 449.42432, "r_y2": 656.09325, "r_x3": 308.86197, "r_y3": 656.09325, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 677.21707, "r_x1": 431.90985, "r_y1": 677.21707, "r_x2": 431.90985, "r_y2": 668.2607, "r_x3": 320.81696, "r_y3": 668.2607, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.49896, "r_y0": 677.2868100000001, "r_x1": 545.11255, "r_y1": 677.2868100000001, "r_x2": 545.11255, "r_y2": 668.3802499999999, "r_x3": 439.49896, "r_y3": 668.3802499999999, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 689.24181, "r_x1": 545.11499, "r_y1": 689.24181, "r_x2": 545.11499, "r_y2": 680.33525, "r_x3": 308.86197, "r_y3": 680.33525, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 701.196815, "r_x1": 545.11511, "r_y1": 701.196815, "r_x2": 545.11511, "r_y2": 692.290253, "r_x3": 308.86197, "r_y3": 692.290253, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 713.1518169999999, "r_x1": 545.11505, "r_y1": 713.1518169999999, "r_x2": 545.11505, "r_y2": 704.245255, "r_x3": 308.86197, "r_y3": 704.245255, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12097, "r_y0": 743.039814, "r_x1": 300.10226, "r_y1": 743.039814, "r_x2": 300.10226, "r_y2": 734.133251, "r_x3": 295.12097, "r_y3": 734.133251, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36511, "b": 96.06994999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9611433148384094, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36511, "r_y1": 84.11492999999996, "r_x2": 286.36511, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 212.28319, "r_y1": 96.06994999999995, "r_x2": 212.28319, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 100.96038999999996, "r": 286.36514, "b": 313.10507, "coord_origin": "TOPLEFT" }, "confidence": 0.988013744354248, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 109.86694, "r_x1": 286.36502, "r_y1": 109.86694, "r_x2": 286.36502, "r_y2": 100.96038999999996, "r_x3": 62.067001, "r_y3": 100.96038999999996, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 121.82195999999999, "r_x1": 286.36508, "r_y1": 121.82195999999999, "r_x2": 286.36508, "r_y2": 112.91540999999995, "r_x3": 50.112, "r_y3": 112.91540999999995, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 133.77697999999998, "r_x1": 286.36508, "r_y1": 133.77697999999998, "r_x2": 286.36508, "r_y2": 124.87041999999997, "r_x3": 50.112, "r_y3": 124.87041999999997, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 145.73297000000002, "r_x1": 286.36511, "r_y1": 145.73297000000002, "r_x2": 286.36511, "r_y2": 136.82641999999998, "r_x3": 50.112, "r_y3": 136.82641999999998, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 157.68799, "r_x1": 286.36511, "r_y1": 157.68799, "r_x2": 286.36511, "r_y2": 148.78143, "r_x3": 50.112, "r_y3": 148.78143, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 169.64301, "r_x1": 286.36508, "r_y1": 169.64301, "r_x2": 286.36508, "r_y2": 160.73645, "r_x3": 50.112, "r_y3": 160.73645, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 181.59802000000002, "r_x1": 286.36505, "r_y1": 181.59802000000002, "r_x2": 286.36505, "r_y2": 172.69146999999998, "r_x3": 50.112, "r_y3": 172.69146999999998, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 193.55304, "r_x1": 286.36508, "r_y1": 193.55304, "r_x2": 286.36508, "r_y2": 184.64648, "r_x3": 50.112, "r_y3": 184.64648, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 205.50903000000005, "r_x1": 286.36508, "r_y1": 205.50903000000005, "r_x2": 286.36508, "r_y2": 196.60248, "r_x3": 50.112, "r_y3": 196.60248, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 217.46405000000004, "r_x1": 286.36508, "r_y1": 217.46405000000004, "r_x2": 286.36508, "r_y2": 208.5575, "r_x3": 50.112, "r_y3": 208.5575, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 229.41907000000003, "r_x1": 286.36511, "r_y1": 229.41907000000003, "r_x2": 286.36511, "r_y2": 220.51251000000002, "r_x3": 50.112, "r_y3": 220.51251000000002, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 241.37408000000005, "r_x1": 286.36508, "r_y1": 241.37408000000005, "r_x2": 286.36508, "r_y2": 232.46753, "r_x3": 50.112, "r_y3": 232.46753, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 253.32910000000004, "r_x1": 286.36508, "r_y1": 253.32910000000004, "r_x2": 286.36508, "r_y2": 244.42255, "r_x3": 50.112, "r_y3": 244.42255, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 265.28412000000003, "r_x1": 286.36505, "r_y1": 265.28412000000003, "r_x2": 286.36505, "r_y2": 256.37756, "r_x3": 50.112, "r_y3": 256.37756, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 277.24010999999996, "r_x1": 286.36505, "r_y1": 277.24010999999996, "r_x2": 286.36505, "r_y2": 268.33356000000003, "r_x3": 50.112, "r_y3": 268.33356000000003, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 289.1951, "r_x1": 68.652397, "r_y1": 289.1951, "r_x2": 68.652397, "r_y2": 280.28853999999995, "r_x3": 50.112, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.566444, "r_y0": 289.1951, "r_x1": 286.36514, "r_y1": 289.1951, "r_x2": 286.36514, "r_y2": 280.28853999999995, "r_x3": 75.566444, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 301.15009, "r_x1": 286.36511, "r_y1": 301.15009, "r_x2": 286.36511, "r_y2": 292.24353, "r_x3": 50.112, "r_y3": 292.24353, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 313.10507, "r_x1": 75.695961, "r_y1": 313.10507, "r_x2": 75.695961, "r_y2": 304.19852000000003, "r_x3": 50.112, "r_y3": 304.19852000000003, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 317.99550999999997, "r": 286.36511, "b": 434.49896, "coord_origin": "TOPLEFT" }, "confidence": 0.9873981475830078, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 326.90207, "r_x1": 286.36499, "r_y1": 326.90207, "r_x2": 286.36499, "r_y2": 317.99550999999997, "r_x3": 62.067001, "r_y3": 317.99550999999997, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 338.8580600000001, "r_x1": 286.36511, "r_y1": 338.8580600000001, "r_x2": 286.36511, "r_y2": 329.95151, "r_x3": 50.112, "r_y3": 329.95151, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 350.81305, "r_x1": 286.36502, "r_y1": 350.81305, "r_x2": 286.36502, "r_y2": 341.90649, "r_x3": 50.112, "r_y3": 341.90649, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 362.76804, "r_x1": 286.36505, "r_y1": 362.76804, "r_x2": 286.36505, "r_y2": 353.8614799999999, "r_x3": 50.112, "r_y3": 353.8614799999999, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 374.72301999999996, "r_x1": 286.36508, "r_y1": 374.72301999999996, "r_x2": 286.36508, "r_y2": 365.81647, "r_x3": 50.112, "r_y3": 365.81647, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 386.67801, "r_x1": 141.58859, "r_y1": 386.67801, "r_x2": 141.58859, "r_y2": 377.77145, "r_x3": 50.112, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.70189, "r_y0": 386.67801, "r_x1": 286.36508, "r_y1": 386.67801, "r_x2": 286.36508, "r_y2": 377.77145, "r_x3": 148.70189, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 398.63300000000004, "r_x1": 286.36508, "r_y1": 398.63300000000004, "r_x2": 286.36508, "r_y2": 389.72644, "r_x3": 50.112, "r_y3": 389.72644, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 410.58899, "r_x1": 286.36511, "r_y1": 410.58899, "r_x2": 286.36511, "r_y2": 401.68243, "r_x3": 50.112, "r_y3": 401.68243, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 422.54398, "r_x1": 286.36511, "r_y1": 422.54398, "r_x2": 286.36511, "r_y2": 413.63742, "r_x3": 50.112, "r_y3": 413.63742, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 434.49896, "r_x1": 216.39774, "r_y1": 434.49896, "r_x2": 216.39774, "r_y2": 425.59241, "r_x3": 50.112, "r_y3": 425.59241, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.112, "t": 439.3894, "r": 286.36655, "b": 627.62389, "coord_origin": "TOPLEFT" }, "confidence": 0.9876030087471008, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 448.2959599999999, "r_x1": 286.36499, "r_y1": 448.2959599999999, "r_x2": 286.36499, "r_y2": 439.3894, "r_x3": 62.067001, "r_y3": 439.3894, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 460.25095, "r_x1": 172.14388, "r_y1": 460.25095, "r_x2": 172.14388, "r_y2": 451.34439, "r_x3": 50.112, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.14801, "r_y0": 460.02182, "r_x1": 224.70818999999997, "r_y1": 460.02182, "r_x2": 224.70818999999997, "r_y2": 451.43405, "r_x3": 174.14801, "r_y3": 451.43405, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.70801, "r_y0": 460.25095, "r_x1": 286.36655, "r_y1": 460.25095, "r_x2": 286.36655, "r_y2": 451.34439, "r_x3": 224.70801, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 472.20694, "r_x1": 286.36505, "r_y1": 472.20694, "r_x2": 286.36505, "r_y2": 463.30038, "r_x3": 50.112015, "r_y3": 463.30038, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 484.16193, "r_x1": 286.36511, "r_y1": 484.16193, "r_x2": 286.36511, "r_y2": 475.25537, "r_x3": 50.112015, "r_y3": 475.25537, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 496.11691, "r_x1": 286.36511, "r_y1": 496.11691, "r_x2": 286.36511, "r_y2": 487.21036, "r_x3": 50.112015, "r_y3": 487.21036, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 508.0719, "r_x1": 286.36508, "r_y1": 508.0719, "r_x2": 286.36508, "r_y2": 499.16534, "r_x3": 50.112015, "r_y3": 499.16534, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 520.02689, "r_x1": 286.36505, "r_y1": 520.02689, "r_x2": 286.36505, "r_y2": 511.12033, "r_x3": 50.112015, "r_y3": 511.12033, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 531.98288, "r_x1": 286.36508, "r_y1": 531.98288, "r_x2": 286.36508, "r_y2": 523.07632, "r_x3": 50.112015, "r_y3": 523.07632, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 543.93788, "r_x1": 286.36508, "r_y1": 543.93788, "r_x2": 286.36508, "r_y2": 535.0313100000001, "r_x3": 50.112015, "r_y3": 535.0313100000001, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 555.89288, "r_x1": 286.36511, "r_y1": 555.89288, "r_x2": 286.36511, "r_y2": 546.98633, "r_x3": 50.112015, "r_y3": 546.98633, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 567.84789, "r_x1": 286.36508, "r_y1": 567.84789, "r_x2": 286.36508, "r_y2": 558.94133, "r_x3": 50.112015, "r_y3": 558.94133, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 579.8028899999999, "r_x1": 286.36511, "r_y1": 579.8028899999999, "r_x2": 286.36511, "r_y2": 570.89633, "r_x3": 50.112015, "r_y3": 570.89633, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 591.75789, "r_x1": 286.36511, "r_y1": 591.75789, "r_x2": 286.36511, "r_y2": 582.85133, "r_x3": 50.112015, "r_y3": 582.85133, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 603.71388, "r_x1": 286.36505, "r_y1": 603.71388, "r_x2": 286.36505, "r_y2": 594.80733, "r_x3": 50.112015, "r_y3": 594.80733, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 615.6688800000001, "r_x1": 286.36508, "r_y1": 615.6688800000001, "r_x2": 286.36508, "r_y2": 606.76233, "r_x3": 50.112015, "r_y3": 606.76233, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 627.62389, "r_x1": 209.7527, "r_y1": 627.62389, "r_x2": 209.7527, "r_y2": 618.71733, "r_x3": 50.112015, "r_y3": 618.71733, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "text", "bbox": { "l": 50.112015, "t": 632.51433, "r": 286.36511, "b": 713.151894, "coord_origin": "TOPLEFT" }, "confidence": 0.9871614575386047, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067017, "r_y0": 641.42088, "r_x1": 286.36499, "r_y1": 641.42088, "r_x2": 286.36499, "r_y2": 632.51433, "r_x3": 62.067017, "r_y3": 632.51433, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 653.37589, "r_x1": 286.36508, "r_y1": 653.37589, "r_x2": 286.36508, "r_y2": 644.46933, "r_x3": 50.112015, "r_y3": 644.46933, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.33189, "r_x1": 286.36511, "r_y1": 665.33189, "r_x2": 286.36511, "r_y2": 656.42532, "r_x3": 50.112015, "r_y3": 656.42532, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28689, "r_x1": 286.36505, "r_y1": 677.28689, "r_x2": 286.36505, "r_y2": 668.38033, "r_x3": 50.112015, "r_y3": 668.38033, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24189, "r_x1": 286.36508, "r_y1": 689.24189, "r_x2": 286.36508, "r_y2": 680.33533, "r_x3": 50.112015, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.196892, "r_x1": 286.36508, "r_y1": 701.196892, "r_x2": 286.36508, "r_y2": 692.290329, "r_x3": 50.112015, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151894, "r_x1": 286.36511, "r_y1": 713.151894, "r_x2": 286.36511, "r_y2": 704.245331, "r_x3": 50.112015, "r_y3": 704.245331, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT" }, "confidence": 0.9777463674545288, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.332, "t": 73.61437999999998, "r": 430.90231, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.85742, "t": 73.61437999999998, "r": 464.4463799999999, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.78632, "t": 73.61437999999998, "r": 494.94193, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28186, "t": 73.61437999999998, "r": 536.91437, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.9673499999999, "r": 361.64264, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.85599, "t": 85.6684600000001, "r": 425.37775, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.89569, "t": 85.6684600000001, "r": 457.41745000000003, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.401, "t": 85.9673499999999, "r": 496.3262, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63495, "t": 85.9673499999999, "r": 532.56012, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92236000000003, "r": 359.43094, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.85599, "t": 97.62347, "r": 425.37775, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.89569, "t": 97.62347, "r": 457.41745000000003, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.401, "t": 97.92236000000003, "r": 496.3262, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46185, "t": 97.92236000000003, "r": 531.73328, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.87836000000004, "r": 359.97888, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.85599, "t": 109.57947000000001, "r": 425.37775, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81226, "t": 109.57947000000001, "r": 456.50091999999995, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.401, "t": 109.87836000000004, "r": 496.3262, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25017999999994, "t": 109.87836000000004, "r": 533.94501, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83336999999995, "r": 400.37723, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.85599, "t": 121.53448000000003, "r": 425.37775, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.89569, "t": 121.53448000000003, "r": 457.41745000000003, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.401, "t": 121.83336999999995, "r": 496.3262, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63495, "t": 121.83336999999995, "r": 532.56012, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.78839000000005, "r": 375.17184, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.85599, "t": 133.48950000000002, "r": 425.37775, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.89569, "t": 133.48950000000002, "r": 457.41745000000003, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.401, "t": 133.78839000000005, "r": 496.3262, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63495, "t": 133.78839000000005, "r": 532.56012, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74341000000004, "r": 369.39352, "b": 154.64995999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.85599, "t": 145.44446000000005, "r": 425.37775, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.89569, "t": 145.44446000000005, "r": 457.41745000000003, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.401, "t": 145.74334999999996, "r": 496.3262, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63495, "t": 145.74334999999996, "r": 532.56012, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 9, "label": "caption", "bbox": { "l": 308.862, "t": 167.66138, "r": 545.11505, "b": 224.38897999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9667726755142212, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 176.56793000000005, "r_x1": 344.6178, "r_y1": 176.56793000000005, "r_x2": 344.6178, "r_y2": 167.66138, "r_x3": 308.862, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.07602, "r_y0": 176.56793000000005, "r_x1": 380.45328, "r_y1": 176.56793000000005, "r_x2": 380.45328, "r_y2": 167.66138, "r_x3": 361.07602, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.56799, "r_y0": 176.33880999999997, "r_x1": 468.67974999999996, "r_y1": 176.33880999999997, "r_x2": 468.67974999999996, "r_y2": 167.75104, "r_x3": 386.56799, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.79599, "r_y0": 176.56793000000005, "r_x1": 489.18198, "r_y1": 176.56793000000005, "r_x2": 489.18198, "r_y2": 167.66138, "r_x3": 474.79599, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.29898000000003, "r_y0": 176.33880999999997, "r_x1": 545.112, "r_y1": 176.33880999999997, "r_x2": 545.112, "r_y2": 167.75104, "r_x3": 495.29898000000003, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 188.29381999999998, "r_x1": 341.16077, "r_y1": 188.29381999999998, "r_x2": 341.16077, "r_y2": 179.70605, "r_x3": 308.862, "r_y3": 179.70605, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.457, "r_y0": 188.52295000000004, "r_x1": 545.11005, "r_y1": 188.52295000000004, "r_x2": 545.11005, "r_y2": 179.61639000000002, "r_x3": 343.457, "r_y3": 179.61639000000002, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 200.47797000000003, "r_x1": 545.11505, "r_y1": 200.47797000000003, "r_x2": 545.11505, "r_y2": 191.57141000000001, "r_x3": 308.862, "r_y3": 191.57141000000001, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 212.43298000000004, "r_x1": 545.11499, "r_y1": 212.43298000000004, "r_x2": 545.11499, "r_y2": 203.52643, "r_x3": 308.862, "r_y3": 203.52643, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 224.38897999999995, "r_x1": 523.93469, "r_y1": 224.38897999999995, "r_x2": 523.93469, "r_y2": 215.48242000000005, "r_x3": 308.862, "r_y3": 215.48242000000005, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 308.862, "t": 249.62041999999997, "r": 545.11517, "b": 294.39197, "coord_origin": "TOPLEFT" }, "confidence": 0.978954017162323, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.52698, "r_x1": 545.11517, "r_y1": 258.52698, "r_x2": 545.11517, "r_y2": 249.62041999999997, "r_x3": 308.862, "r_y3": 249.62041999999997, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.48199, "r_x1": 545.11517, "r_y1": 270.48199, "r_x2": 545.11517, "r_y2": 261.57543999999996, "r_x3": 308.862, "r_y3": 261.57543999999996, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.43698, "r_x1": 545.11505, "r_y1": 282.43698, "r_x2": 545.11505, "r_y2": 273.5304, "r_x3": 308.862, "r_y3": 273.5304, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.39197, "r_x1": 436.82169, "r_y1": 294.39197, "r_x2": 436.82169, "r_y2": 285.48541000000006, "r_x3": 308.862, "r_y3": 285.48541000000006, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 320.81699, "t": 297.77240000000006, "r": 542.74396, "b": 306.67896, "coord_origin": "TOPLEFT" }, "confidence": 0.9043695330619812, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 306.67896, "r_x1": 542.74396, "r_y1": 306.67896, "r_x2": 542.74396, "r_y2": 297.77240000000006, "r_x3": 320.81699, "r_y3": 297.77240000000006, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "section_header", "bbox": { "l": 308.862, "t": 321.18396, "r": 444.93607000000003, "b": 331.93167000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9466595649719238, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 331.93167000000005, "r_x1": 316.28476, "r_y1": 331.93167000000005, "r_x2": 316.28476, "r_y2": 321.18396, "r_x3": 308.862, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18176, "r_y0": 331.93167000000005, "r_x1": 444.93607000000003, "r_y1": 331.93167000000005, "r_x2": 444.93607000000003, "r_y2": 321.18396, "r_x3": 326.18176, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 341.93939, "r": 545.11523, "b": 446.48685000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.9884450435638428, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 350.84594999999996, "r_x1": 545.11499, "r_y1": 350.84594999999996, "r_x2": 545.11499, "r_y2": 341.93939, "r_x3": 320.81699, "r_y3": 341.93939, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 362.80092999999994, "r_x1": 545.11511, "r_y1": 362.80092999999994, "r_x2": 545.11511, "r_y2": 353.89438, "r_x3": 308.862, "r_y3": 353.89438, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 374.75592, "r_x1": 545.11517, "r_y1": 374.75592, "r_x2": 545.11517, "r_y2": 365.84937, "r_x3": 308.862, "r_y3": 365.84937, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 386.71091, "r_x1": 545.11505, "r_y1": 386.71091, "r_x2": 545.11505, "r_y2": 377.80435, "r_x3": 308.862, "r_y3": 377.80435, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 398.66588999999993, "r_x1": 545.11517, "r_y1": 398.66588999999993, "r_x2": 545.11517, "r_y2": 389.75934000000007, "r_x3": 308.862, "r_y3": 389.75934000000007, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 410.62088, "r_x1": 545.11523, "r_y1": 410.62088, "r_x2": 545.11523, "r_y2": 401.71432000000004, "r_x3": 308.862, "r_y3": 401.71432000000004, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 422.57687, "r_x1": 545.11517, "r_y1": 422.57687, "r_x2": 545.11517, "r_y2": 413.67032, "r_x3": 308.862, "r_y3": 413.67032, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 434.53186, "r_x1": 545.11505, "r_y1": 434.53186, "r_x2": 545.11505, "r_y2": 425.62531, "r_x3": 308.862, "r_y3": 425.62531, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 446.48685000000006, "r_x1": 437.9375, "r_y1": 446.48685000000006, "r_x2": 437.9375, "r_y2": 437.58029, "r_x3": 308.862, "r_y3": 437.58029, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "section_header", "bbox": { "l": 308.862, "t": 457.69427, "r": 420.16058, "b": 467.54633, "coord_origin": "TOPLEFT" }, "confidence": 0.937696099281311, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 467.54633, "r_x1": 323.14081, "r_y1": 467.54633, "r_x2": 323.14081, "r_y2": 457.69427, "r_x3": 308.862, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66003, "r_y0": 467.54633, "r_x1": 420.16058, "r_y1": 467.54633, "r_x2": 420.16058, "r_y2": 457.69427, "r_x3": 332.66003, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.86197, "t": 476.76529, "r": 545.11572, "b": 664.99981, "coord_origin": "TOPLEFT" }, "confidence": 0.9878323078155518, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 485.67184, "r_x1": 545.11487, "r_y1": 485.67184, "r_x2": 545.11487, "r_y2": 476.76529, "r_x3": 320.81699, "r_y3": 476.76529, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.62683, "r_x1": 509.02054, "r_y1": 497.62683, "r_x2": 509.02054, "r_y2": 488.72028, "r_x3": 308.862, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.58588, "r_y0": 497.62683, "r_x1": 523.05786, "r_y1": 497.62683, "r_x2": 523.05786, "r_y2": 488.72028, "r_x3": 515.58588, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 497.62683, "r_x1": 545.11505, "r_y1": 497.62683, "r_x2": 545.11505, "r_y2": 488.72028, "r_x3": 529.62323, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 509.35269, "r_x1": 406.34601, "r_y1": 509.35269, "r_x2": 406.34601, "r_y2": 500.76492, "r_x3": 308.862, "r_y3": 500.76492, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87201, "r_y0": 509.58182, "r_x1": 545.1106, "r_y1": 509.58182, "r_x2": 545.1106, "r_y2": 500.67526, "r_x3": 408.87201, "r_y3": 500.67526, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 521.53781, "r_x1": 409.39459, "r_y1": 521.53781, "r_x2": 409.39459, "r_y2": 512.63126, "r_x3": 308.862, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.72705, "r_y0": 521.53781, "r_x1": 545.11505, "r_y1": 521.53781, "r_x2": 545.11505, "r_y2": 512.63126, "r_x3": 416.72705, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.4928, "r_x1": 436.194, "r_y1": 533.4928, "r_x2": 436.194, "r_y2": 524.58624, "r_x3": 308.862, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.526, "r_y0": 533.26367, "r_x1": 513.86694, "r_y1": 533.26367, "r_x2": 513.86694, "r_y2": 524.6759, "r_x3": 439.526, "r_y3": 524.6759, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43201, "r_y0": 533.4928, "r_x1": 545.10815, "r_y1": 533.4928, "r_x2": 545.10815, "r_y2": 524.58624, "r_x3": 517.43201, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.4478, "r_x1": 545.11511, "r_y1": 545.4478, "r_x2": 545.11511, "r_y2": 536.54124, "r_x3": 308.862, "r_y3": 536.54124, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.4028000000001, "r_x1": 358.5455, "r_y1": 557.4028000000001, "r_x2": 358.5455, "r_y2": 548.49625, "r_x3": 308.862, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19055, "r_y0": 557.4028000000001, "r_x1": 545.11517, "r_y1": 557.4028000000001, "r_x2": 545.11517, "r_y2": 548.49625, "r_x3": 365.19055, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.3578, "r_x1": 352.40851, "r_y1": 569.3578, "r_x2": 352.40851, "r_y2": 560.45125, "r_x3": 308.862, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.409, "r_y0": 569.13863, "r_x1": 360.1579, "r_y1": 569.13863, "r_x2": 360.1579, "r_y2": 560.29184, "r_x3": 352.409, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.15799, "r_y0": 569.3578, "r_x1": 367.90891, "r_y1": 569.3578, "r_x2": 367.90891, "r_y2": 560.45125, "r_x3": 360.15799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.909, "r_y0": 569.13863, "r_x1": 375.6579, "r_y1": 569.13863, "r_x2": 375.6579, "r_y2": 560.29184, "r_x3": 367.909, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.65799, "r_y0": 569.3578, "r_x1": 545.11182, "r_y1": 569.3578, "r_x2": 545.11182, "r_y2": 560.45125, "r_x3": 375.65799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.3138, "r_x1": 545.11499, "r_y1": 581.3138, "r_x2": 545.11499, "r_y2": 572.40724, "r_x3": 308.862, "r_y3": 572.40724, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.2688, "r_x1": 483.11768, "r_y1": 593.2688, "r_x2": 483.11768, "r_y2": 584.3622399999999, "r_x3": 308.862, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 593.04962, "r_x1": 490.86792, "r_y1": 593.04962, "r_x2": 490.86792, "r_y2": 584.20284, "r_x3": 483.11902, "r_y3": 584.20284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.86800999999997, "r_y0": 593.2688, "r_x1": 545.11438, "r_y1": 593.2688, "r_x2": 545.11438, "r_y2": 584.3622399999999, "r_x3": 490.86800999999997, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2238, "r_x1": 545.11493, "r_y1": 605.2238, "r_x2": 545.11493, "r_y2": 596.31725, "r_x3": 308.862, "r_y3": 596.31725, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.1788, "r_x1": 329.64395, "r_y1": 617.1788, "r_x2": 329.64395, "r_y2": 608.27225, "r_x3": 308.862, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.646, "r_y0": 616.9596300000001, "r_x1": 337.3949, "r_y1": 616.9596300000001, "r_x2": 337.3949, "r_y2": 608.11284, "r_x3": 329.646, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39398, "r_y0": 617.1788, "r_x1": 468.5914, "r_y1": 617.1788, "r_x2": 468.5914, "r_y2": 608.27225, "r_x3": 337.39398, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59496999999993, "r_y0": 616.9596300000001, "r_x1": 476.34387000000004, "r_y1": 616.9596300000001, "r_x2": 476.34387000000004, "r_y2": 608.11284, "r_x3": 468.59496999999993, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.3439599999999, "r_y0": 617.1788, "r_x1": 545.11572, "r_y1": 617.1788, "r_x2": 545.11572, "r_y2": 608.27225, "r_x3": 476.3439599999999, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.1338000000001, "r_x1": 545.11499, "r_y1": 629.1338000000001, "r_x2": 545.11499, "r_y2": 620.22725, "r_x3": 308.86197, "r_y3": 620.22725, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.08881, "r_x1": 545.11517, "r_y1": 641.08881, "r_x2": 545.11517, "r_y2": 632.1822500000001, "r_x3": 308.86197, "r_y3": 632.1822500000001, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.0448, "r_x1": 545.11511, "r_y1": 653.0448, "r_x2": 545.11511, "r_y2": 644.13824, "r_x3": 308.86197, "r_y3": 644.13824, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 664.99981, "r_x1": 449.42432, "r_y1": 664.99981, "r_x2": 449.42432, "r_y2": 656.09325, "r_x3": 308.86197, "r_y3": 656.09325, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 308.86197, "t": 668.2607, "r": 545.11511, "b": 713.1518169999999, "coord_origin": "TOPLEFT" }, "confidence": 0.978580117225647, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 677.21707, "r_x1": 431.90985, "r_y1": 677.21707, "r_x2": 431.90985, "r_y2": 668.2607, "r_x3": 320.81696, "r_y3": 668.2607, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.49896, "r_y0": 677.2868100000001, "r_x1": 545.11255, "r_y1": 677.2868100000001, "r_x2": 545.11255, "r_y2": 668.3802499999999, "r_x3": 439.49896, "r_y3": 668.3802499999999, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 689.24181, "r_x1": 545.11499, "r_y1": 689.24181, "r_x2": 545.11499, "r_y2": 680.33525, "r_x3": 308.86197, "r_y3": 680.33525, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 701.196815, "r_x1": 545.11511, "r_y1": 701.196815, "r_x2": 545.11511, "r_y2": 692.290253, "r_x3": 308.86197, "r_y3": 692.290253, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 713.1518169999999, "r_x1": 545.11505, "r_y1": 713.1518169999999, "r_x2": 545.11505, "r_y2": 704.245255, "r_x3": 308.86197, "r_y3": 704.245255, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_footer", "bbox": { "l": 295.12097, "t": 734.133251, "r": 300.10226, "b": 743.039814, "coord_origin": "TOPLEFT" }, "confidence": 0.8565718531608582, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12097, "r_y0": 743.039814, "r_x1": 300.10226, "r_y1": 743.039814, "r_x2": 300.10226, "r_y2": 734.133251, "r_x3": 295.12097, "r_y3": 734.133251, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "8": { "label": "table", "id": 8, "page_no": 3, "cluster": { "id": 8, "label": "table", "bbox": { "l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT" }, "confidence": 0.9777463674545288, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.332, "t": 73.61437999999998, "r": 430.90231, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.85742, "t": 73.61437999999998, "r": 464.4463799999999, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.78632, "t": 73.61437999999998, "r": 494.94193, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28186, "t": 73.61437999999998, "r": 536.91437, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.9673499999999, "r": 361.64264, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.85599, "t": 85.6684600000001, "r": 425.37775, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.89569, "t": 85.6684600000001, "r": 457.41745000000003, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.401, "t": 85.9673499999999, "r": 496.3262, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63495, "t": 85.9673499999999, "r": 532.56012, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92236000000003, "r": 359.43094, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.85599, "t": 97.62347, "r": 425.37775, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.89569, "t": 97.62347, "r": 457.41745000000003, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.401, "t": 97.92236000000003, "r": 496.3262, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46185, "t": 97.92236000000003, "r": 531.73328, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.87836000000004, "r": 359.97888, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.85599, "t": 109.57947000000001, "r": 425.37775, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81226, "t": 109.57947000000001, "r": 456.50091999999995, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.401, "t": 109.87836000000004, "r": 496.3262, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25017999999994, "t": 109.87836000000004, "r": 533.94501, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83336999999995, "r": 400.37723, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.85599, "t": 121.53448000000003, "r": 425.37775, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.89569, "t": 121.53448000000003, "r": 457.41745000000003, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.401, "t": 121.83336999999995, "r": 496.3262, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63495, "t": 121.83336999999995, "r": 532.56012, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.78839000000005, "r": 375.17184, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.85599, "t": 133.48950000000002, "r": 425.37775, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.89569, "t": 133.48950000000002, "r": 457.41745000000003, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.401, "t": 133.78839000000005, "r": 496.3262, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63495, "t": 133.78839000000005, "r": 532.56012, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74341000000004, "r": 369.39352, "b": 154.64995999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.85599, "t": 145.44446000000005, "r": 425.37775, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.89569, "t": 145.44446000000005, "r": 457.41745000000003, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.401, "t": 145.74334999999996, "r": 496.3262, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63495, "t": 145.74334999999996, "r": 532.56012, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 412.332, "t": 73.61437999999998, "r": 430.90231, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 442.85742, "t": 73.61437999999998, "r": 464.4463799999999, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 477.78632, "t": 73.61437999999998, "r": 494.94193, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 508.28186, "t": 73.61437999999998, "r": 536.91437, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 85.9673499999999, "r": 361.64264, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 85.6684600000001, "r": 425.37775, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 85.6684600000001, "r": 457.41745000000003, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 85.9673499999999, "r": 496.3262, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 85.9673499999999, "r": 532.56012, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 97.92236000000003, "r": 359.43094, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 97.62347, "r": 425.37775, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 97.62347, "r": 457.41745000000003, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 97.92236000000003, "r": 496.3262, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.46185, "t": 97.92236000000003, "r": 531.73328, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 109.87836000000004, "r": 359.97888, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 109.57947000000001, "r": 425.37775, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 450.81226, "t": 109.57947000000001, "r": 456.50091999999995, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 109.87836000000004, "r": 496.3262, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 511.25017999999994, "t": 109.87836000000004, "r": 533.94501, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 121.83336999999995, "r": 400.37723, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 121.53448000000003, "r": 425.37775, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 121.53448000000003, "r": 457.41745000000003, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 121.83336999999995, "r": 496.3262, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 121.83336999999995, "r": 532.56012, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 133.78839000000005, "r": 375.17184, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 133.48950000000002, "r": 425.37775, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 133.48950000000002, "r": 457.41745000000003, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 133.78839000000005, "r": 496.3262, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 133.78839000000005, "r": 532.56012, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 145.74341000000004, "r": 369.39352, "b": 154.64995999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 145.44446000000005, "r": 425.37775, "b": 154.65985, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 145.44446000000005, "r": 457.41745000000003, "b": 154.65985, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 145.74334999999996, "r": 496.3262, "b": 154.6499, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 145.74334999999996, "r": 532.56012, "b": 154.6499, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 10, "page_no": 3, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36511, "b": 96.06994999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9611433148384094, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36511, "r_y1": 84.11492999999996, "r_x2": 286.36511, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 212.28319, "r_y1": 96.06994999999995, "r_x2": 212.28319, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)." }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 100.96038999999996, "r": 286.36514, "b": 313.10507, "coord_origin": "TOPLEFT" }, "confidence": 0.988013744354248, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 109.86694, "r_x1": 286.36502, "r_y1": 109.86694, "r_x2": 286.36502, "r_y2": 100.96038999999996, "r_x3": 62.067001, "r_y3": 100.96038999999996, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 121.82195999999999, "r_x1": 286.36508, "r_y1": 121.82195999999999, "r_x2": 286.36508, "r_y2": 112.91540999999995, "r_x3": 50.112, "r_y3": 112.91540999999995, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 133.77697999999998, "r_x1": 286.36508, "r_y1": 133.77697999999998, "r_x2": 286.36508, "r_y2": 124.87041999999997, "r_x3": 50.112, "r_y3": 124.87041999999997, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 145.73297000000002, "r_x1": 286.36511, "r_y1": 145.73297000000002, "r_x2": 286.36511, "r_y2": 136.82641999999998, "r_x3": 50.112, "r_y3": 136.82641999999998, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 157.68799, "r_x1": 286.36511, "r_y1": 157.68799, "r_x2": 286.36511, "r_y2": 148.78143, "r_x3": 50.112, "r_y3": 148.78143, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 169.64301, "r_x1": 286.36508, "r_y1": 169.64301, "r_x2": 286.36508, "r_y2": 160.73645, "r_x3": 50.112, "r_y3": 160.73645, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 181.59802000000002, "r_x1": 286.36505, "r_y1": 181.59802000000002, "r_x2": 286.36505, "r_y2": 172.69146999999998, "r_x3": 50.112, "r_y3": 172.69146999999998, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 193.55304, "r_x1": 286.36508, "r_y1": 193.55304, "r_x2": 286.36508, "r_y2": 184.64648, "r_x3": 50.112, "r_y3": 184.64648, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 205.50903000000005, "r_x1": 286.36508, "r_y1": 205.50903000000005, "r_x2": 286.36508, "r_y2": 196.60248, "r_x3": 50.112, "r_y3": 196.60248, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 217.46405000000004, "r_x1": 286.36508, "r_y1": 217.46405000000004, "r_x2": 286.36508, "r_y2": 208.5575, "r_x3": 50.112, "r_y3": 208.5575, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 229.41907000000003, "r_x1": 286.36511, "r_y1": 229.41907000000003, "r_x2": 286.36511, "r_y2": 220.51251000000002, "r_x3": 50.112, "r_y3": 220.51251000000002, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 241.37408000000005, "r_x1": 286.36508, "r_y1": 241.37408000000005, "r_x2": 286.36508, "r_y2": 232.46753, "r_x3": 50.112, "r_y3": 232.46753, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 253.32910000000004, "r_x1": 286.36508, "r_y1": 253.32910000000004, "r_x2": 286.36508, "r_y2": 244.42255, "r_x3": 50.112, "r_y3": 244.42255, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 265.28412000000003, "r_x1": 286.36505, "r_y1": 265.28412000000003, "r_x2": 286.36505, "r_y2": 256.37756, "r_x3": 50.112, "r_y3": 256.37756, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 277.24010999999996, "r_x1": 286.36505, "r_y1": 277.24010999999996, "r_x2": 286.36505, "r_y2": 268.33356000000003, "r_x3": 50.112, "r_y3": 268.33356000000003, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 289.1951, "r_x1": 68.652397, "r_y1": 289.1951, "r_x2": 68.652397, "r_y2": 280.28853999999995, "r_x3": 50.112, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.566444, "r_y0": 289.1951, "r_x1": 286.36514, "r_y1": 289.1951, "r_x2": 286.36514, "r_y2": 280.28853999999995, "r_x3": 75.566444, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 301.15009, "r_x1": 286.36511, "r_y1": 301.15009, "r_x2": 286.36511, "r_y2": 292.24353, "r_x3": 50.112, "r_y3": 292.24353, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 313.10507, "r_x1": 75.695961, "r_y1": 313.10507, "r_x2": 75.695961, "r_y2": 304.19852000000003, "r_x3": 50.112, "r_y3": 304.19852000000003, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 317.99550999999997, "r": 286.36511, "b": 434.49896, "coord_origin": "TOPLEFT" }, "confidence": 0.9873981475830078, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 326.90207, "r_x1": 286.36499, "r_y1": 326.90207, "r_x2": 286.36499, "r_y2": 317.99550999999997, "r_x3": 62.067001, "r_y3": 317.99550999999997, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 338.8580600000001, "r_x1": 286.36511, "r_y1": 338.8580600000001, "r_x2": 286.36511, "r_y2": 329.95151, "r_x3": 50.112, "r_y3": 329.95151, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 350.81305, "r_x1": 286.36502, "r_y1": 350.81305, "r_x2": 286.36502, "r_y2": 341.90649, "r_x3": 50.112, "r_y3": 341.90649, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 362.76804, "r_x1": 286.36505, "r_y1": 362.76804, "r_x2": 286.36505, "r_y2": 353.8614799999999, "r_x3": 50.112, "r_y3": 353.8614799999999, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 374.72301999999996, "r_x1": 286.36508, "r_y1": 374.72301999999996, "r_x2": 286.36508, "r_y2": 365.81647, "r_x3": 50.112, "r_y3": 365.81647, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 386.67801, "r_x1": 141.58859, "r_y1": 386.67801, "r_x2": 141.58859, "r_y2": 377.77145, "r_x3": 50.112, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.70189, "r_y0": 386.67801, "r_x1": 286.36508, "r_y1": 386.67801, "r_x2": 286.36508, "r_y2": 377.77145, "r_x3": 148.70189, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 398.63300000000004, "r_x1": 286.36508, "r_y1": 398.63300000000004, "r_x2": 286.36508, "r_y2": 389.72644, "r_x3": 50.112, "r_y3": 389.72644, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 410.58899, "r_x1": 286.36511, "r_y1": 410.58899, "r_x2": 286.36511, "r_y2": 401.68243, "r_x3": 50.112, "r_y3": 401.68243, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 422.54398, "r_x1": 286.36511, "r_y1": 422.54398, "r_x2": 286.36511, "r_y2": 413.63742, "r_x3": 50.112, "r_y3": 413.63742, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 434.49896, "r_x1": 216.39774, "r_y1": 434.49896, "r_x2": 216.39774, "r_y2": 425.59241, "r_x3": 50.112, "r_y3": 425.59241, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data." }, { "label": "text", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.112, "t": 439.3894, "r": 286.36655, "b": 627.62389, "coord_origin": "TOPLEFT" }, "confidence": 0.9876030087471008, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 448.2959599999999, "r_x1": 286.36499, "r_y1": 448.2959599999999, "r_x2": 286.36499, "r_y2": 439.3894, "r_x3": 62.067001, "r_y3": 439.3894, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 460.25095, "r_x1": 172.14388, "r_y1": 460.25095, "r_x2": 172.14388, "r_y2": 451.34439, "r_x3": 50.112, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.14801, "r_y0": 460.02182, "r_x1": 224.70818999999997, "r_y1": 460.02182, "r_x2": 224.70818999999997, "r_y2": 451.43405, "r_x3": 174.14801, "r_y3": 451.43405, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.70801, "r_y0": 460.25095, "r_x1": 286.36655, "r_y1": 460.25095, "r_x2": 286.36655, "r_y2": 451.34439, "r_x3": 224.70801, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 472.20694, "r_x1": 286.36505, "r_y1": 472.20694, "r_x2": 286.36505, "r_y2": 463.30038, "r_x3": 50.112015, "r_y3": 463.30038, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 484.16193, "r_x1": 286.36511, "r_y1": 484.16193, "r_x2": 286.36511, "r_y2": 475.25537, "r_x3": 50.112015, "r_y3": 475.25537, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 496.11691, "r_x1": 286.36511, "r_y1": 496.11691, "r_x2": 286.36511, "r_y2": 487.21036, "r_x3": 50.112015, "r_y3": 487.21036, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 508.0719, "r_x1": 286.36508, "r_y1": 508.0719, "r_x2": 286.36508, "r_y2": 499.16534, "r_x3": 50.112015, "r_y3": 499.16534, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 520.02689, "r_x1": 286.36505, "r_y1": 520.02689, "r_x2": 286.36505, "r_y2": 511.12033, "r_x3": 50.112015, "r_y3": 511.12033, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 531.98288, "r_x1": 286.36508, "r_y1": 531.98288, "r_x2": 286.36508, "r_y2": 523.07632, "r_x3": 50.112015, "r_y3": 523.07632, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 543.93788, "r_x1": 286.36508, "r_y1": 543.93788, "r_x2": 286.36508, "r_y2": 535.0313100000001, "r_x3": 50.112015, "r_y3": 535.0313100000001, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 555.89288, "r_x1": 286.36511, "r_y1": 555.89288, "r_x2": 286.36511, "r_y2": 546.98633, "r_x3": 50.112015, "r_y3": 546.98633, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 567.84789, "r_x1": 286.36508, "r_y1": 567.84789, "r_x2": 286.36508, "r_y2": 558.94133, "r_x3": 50.112015, "r_y3": 558.94133, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 579.8028899999999, "r_x1": 286.36511, "r_y1": 579.8028899999999, "r_x2": 286.36511, "r_y2": 570.89633, "r_x3": 50.112015, "r_y3": 570.89633, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 591.75789, "r_x1": 286.36511, "r_y1": 591.75789, "r_x2": 286.36511, "r_y2": 582.85133, "r_x3": 50.112015, "r_y3": 582.85133, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 603.71388, "r_x1": 286.36505, "r_y1": 603.71388, "r_x2": 286.36505, "r_y2": 594.80733, "r_x3": 50.112015, "r_y3": 594.80733, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 615.6688800000001, "r_x1": 286.36508, "r_y1": 615.6688800000001, "r_x2": 286.36508, "r_y2": 606.76233, "r_x3": 50.112015, "r_y3": 606.76233, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 627.62389, "r_x1": 209.7527, "r_y1": 627.62389, "r_x2": 209.7527, "r_y2": 618.71733, "r_x3": 50.112015, "r_y3": 618.71733, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain." }, { "label": "text", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.112015, "t": 632.51433, "r": 286.36511, "b": 713.151894, "coord_origin": "TOPLEFT" }, "confidence": 0.9871614575386047, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067017, "r_y0": 641.42088, "r_x1": 286.36499, "r_y1": 641.42088, "r_x2": 286.36499, "r_y2": 632.51433, "r_x3": 62.067017, "r_y3": 632.51433, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 653.37589, "r_x1": 286.36508, "r_y1": 653.37589, "r_x2": 286.36508, "r_y2": 644.46933, "r_x3": 50.112015, "r_y3": 644.46933, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.33189, "r_x1": 286.36511, "r_y1": 665.33189, "r_x2": 286.36511, "r_y2": 656.42532, "r_x3": 50.112015, "r_y3": 656.42532, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28689, "r_x1": 286.36505, "r_y1": 677.28689, "r_x2": 286.36505, "r_y2": 668.38033, "r_x3": 50.112015, "r_y3": 668.38033, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24189, "r_x1": 286.36508, "r_y1": 689.24189, "r_x2": 286.36508, "r_y2": 680.33533, "r_x3": 50.112015, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.196892, "r_x1": 286.36508, "r_y1": 701.196892, "r_x2": 286.36508, "r_y2": 692.290329, "r_x3": 50.112015, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151894, "r_x1": 286.36511, "r_y1": 713.151894, "r_x2": 286.36511, "r_y2": 704.245331, "r_x3": 50.112015, "r_y3": 704.245331, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third" }, { "label": "table", "id": 8, "page_no": 3, "cluster": { "id": 8, "label": "table", "bbox": { "l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT" }, "confidence": 0.9777463674545288, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.332, "t": 73.61437999999998, "r": 430.90231, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.85742, "t": 73.61437999999998, "r": 464.4463799999999, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.78632, "t": 73.61437999999998, "r": 494.94193, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28186, "t": 73.61437999999998, "r": 536.91437, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.9673499999999, "r": 361.64264, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.85599, "t": 85.6684600000001, "r": 425.37775, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.89569, "t": 85.6684600000001, "r": 457.41745000000003, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.401, "t": 85.9673499999999, "r": 496.3262, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63495, "t": 85.9673499999999, "r": 532.56012, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92236000000003, "r": 359.43094, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.85599, "t": 97.62347, "r": 425.37775, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.89569, "t": 97.62347, "r": 457.41745000000003, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.401, "t": 97.92236000000003, "r": 496.3262, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46185, "t": 97.92236000000003, "r": 531.73328, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.87836000000004, "r": 359.97888, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.85599, "t": 109.57947000000001, "r": 425.37775, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81226, "t": 109.57947000000001, "r": 456.50091999999995, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.401, "t": 109.87836000000004, "r": 496.3262, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25017999999994, "t": 109.87836000000004, "r": 533.94501, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83336999999995, "r": 400.37723, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.85599, "t": 121.53448000000003, "r": 425.37775, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.89569, "t": 121.53448000000003, "r": 457.41745000000003, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.401, "t": 121.83336999999995, "r": 496.3262, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63495, "t": 121.83336999999995, "r": 532.56012, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.78839000000005, "r": 375.17184, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.85599, "t": 133.48950000000002, "r": 425.37775, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.89569, "t": 133.48950000000002, "r": 457.41745000000003, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.401, "t": 133.78839000000005, "r": 496.3262, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63495, "t": 133.78839000000005, "r": 532.56012, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74341000000004, "r": 369.39352, "b": 154.64995999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.85599, "t": 145.44446000000005, "r": 425.37775, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.89569, "t": 145.44446000000005, "r": 457.41745000000003, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.401, "t": 145.74334999999996, "r": 496.3262, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63495, "t": 145.74334999999996, "r": 532.56012, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 412.332, "t": 73.61437999999998, "r": 430.90231, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 442.85742, "t": 73.61437999999998, "r": 464.4463799999999, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 477.78632, "t": 73.61437999999998, "r": 494.94193, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 508.28186, "t": 73.61437999999998, "r": 536.91437, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 85.9673499999999, "r": 361.64264, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 85.6684600000001, "r": 425.37775, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 85.6684600000001, "r": 457.41745000000003, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 85.9673499999999, "r": 496.3262, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 85.9673499999999, "r": 532.56012, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 97.92236000000003, "r": 359.43094, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 97.62347, "r": 425.37775, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 97.62347, "r": 457.41745000000003, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 97.92236000000003, "r": 496.3262, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.46185, "t": 97.92236000000003, "r": 531.73328, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 109.87836000000004, "r": 359.97888, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 109.57947000000001, "r": 425.37775, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 450.81226, "t": 109.57947000000001, "r": 456.50091999999995, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 109.87836000000004, "r": 496.3262, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 511.25017999999994, "t": 109.87836000000004, "r": 533.94501, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 121.83336999999995, "r": 400.37723, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 121.53448000000003, "r": 425.37775, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 121.53448000000003, "r": 457.41745000000003, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 121.83336999999995, "r": 496.3262, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 121.83336999999995, "r": 532.56012, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 133.78839000000005, "r": 375.17184, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 133.48950000000002, "r": 425.37775, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 133.48950000000002, "r": 457.41745000000003, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 133.78839000000005, "r": 496.3262, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 133.78839000000005, "r": 532.56012, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 145.74341000000004, "r": 369.39352, "b": 154.64995999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 145.44446000000005, "r": 425.37775, "b": 154.65985, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 145.44446000000005, "r": 457.41745000000003, "b": 154.65985, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 145.74334999999996, "r": 496.3262, "b": 154.6499, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 145.74334999999996, "r": 532.56012, "b": 154.6499, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 9, "page_no": 3, "cluster": { "id": 9, "label": "caption", "bbox": { "l": 308.862, "t": 167.66138, "r": 545.11505, "b": 224.38897999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9667726755142212, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 176.56793000000005, "r_x1": 344.6178, "r_y1": 176.56793000000005, "r_x2": 344.6178, "r_y2": 167.66138, "r_x3": 308.862, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.07602, "r_y0": 176.56793000000005, "r_x1": 380.45328, "r_y1": 176.56793000000005, "r_x2": 380.45328, "r_y2": 167.66138, "r_x3": 361.07602, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.56799, "r_y0": 176.33880999999997, "r_x1": 468.67974999999996, "r_y1": 176.33880999999997, "r_x2": 468.67974999999996, "r_y2": 167.75104, "r_x3": 386.56799, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.79599, "r_y0": 176.56793000000005, "r_x1": 489.18198, "r_y1": 176.56793000000005, "r_x2": 489.18198, "r_y2": 167.66138, "r_x3": 474.79599, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.29898000000003, "r_y0": 176.33880999999997, "r_x1": 545.112, "r_y1": 176.33880999999997, "r_x2": 545.112, "r_y2": 167.75104, "r_x3": 495.29898000000003, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 188.29381999999998, "r_x1": 341.16077, "r_y1": 188.29381999999998, "r_x2": 341.16077, "r_y2": 179.70605, "r_x3": 308.862, "r_y3": 179.70605, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.457, "r_y0": 188.52295000000004, "r_x1": 545.11005, "r_y1": 188.52295000000004, "r_x2": 545.11005, "r_y2": 179.61639000000002, "r_x3": 343.457, "r_y3": 179.61639000000002, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 200.47797000000003, "r_x1": 545.11505, "r_y1": 200.47797000000003, "r_x2": 545.11505, "r_y2": 191.57141000000001, "r_x3": 308.862, "r_y3": 191.57141000000001, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 212.43298000000004, "r_x1": 545.11499, "r_y1": 212.43298000000004, "r_x2": 545.11499, "r_y2": 203.52643, "r_x3": 308.862, "r_y3": 203.52643, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 224.38897999999995, "r_x1": 523.93469, "r_y1": 224.38897999999995, "r_x2": 523.93469, "r_y2": 215.48242000000005, "r_x3": 308.862, "r_y3": 215.48242000000005, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank." }, { "label": "text", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "text", "bbox": { "l": 308.862, "t": 249.62041999999997, "r": 545.11517, "b": 294.39197, "coord_origin": "TOPLEFT" }, "confidence": 0.978954017162323, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.52698, "r_x1": 545.11517, "r_y1": 258.52698, "r_x2": 545.11517, "r_y2": 249.62041999999997, "r_x3": 308.862, "r_y3": 249.62041999999997, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.48199, "r_x1": 545.11517, "r_y1": 270.48199, "r_x2": 545.11517, "r_y2": 261.57543999999996, "r_x3": 308.862, "r_y3": 261.57543999999996, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.43698, "r_x1": 545.11505, "r_y1": 282.43698, "r_x2": 545.11505, "r_y2": 273.5304, "r_x3": 308.862, "r_y3": 273.5304, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.39197, "r_x1": 436.82169, "r_y1": 294.39197, "r_x2": 436.82169, "r_y2": 285.48541000000006, "r_x3": 308.862, "r_y3": 285.48541000000006, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples." }, { "label": "text", "id": 13, "page_no": 3, "cluster": { "id": 13, "label": "text", "bbox": { "l": 320.81699, "t": 297.77240000000006, "r": 542.74396, "b": 306.67896, "coord_origin": "TOPLEFT" }, "confidence": 0.9043695330619812, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 306.67896, "r_x1": 542.74396, "r_y1": 306.67896, "r_x2": 542.74396, "r_y2": 297.77240000000006, "r_x3": 320.81699, "r_y3": 297.77240000000006, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tab. 1 summarizes the various attributes of the datasets." }, { "label": "section_header", "id": 11, "page_no": 3, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 308.862, "t": 321.18396, "r": 444.93607000000003, "b": 331.93167000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9466595649719238, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 331.93167000000005, "r_x1": 316.28476, "r_y1": 331.93167000000005, "r_x2": 316.28476, "r_y2": 321.18396, "r_x3": 308.862, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18176, "r_y0": 331.93167000000005, "r_x1": 444.93607000000003, "r_y1": 331.93167000000005, "r_x2": 444.93607000000003, "r_y2": 321.18396, "r_x3": 326.18176, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. The TableFormer model" }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 341.93939, "r": 545.11523, "b": 446.48685000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.9884450435638428, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 350.84594999999996, "r_x1": 545.11499, "r_y1": 350.84594999999996, "r_x2": 545.11499, "r_y2": 341.93939, "r_x3": 320.81699, "r_y3": 341.93939, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 362.80092999999994, "r_x1": 545.11511, "r_y1": 362.80092999999994, "r_x2": 545.11511, "r_y2": 353.89438, "r_x3": 308.862, "r_y3": 353.89438, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 374.75592, "r_x1": 545.11517, "r_y1": 374.75592, "r_x2": 545.11517, "r_y2": 365.84937, "r_x3": 308.862, "r_y3": 365.84937, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 386.71091, "r_x1": 545.11505, "r_y1": 386.71091, "r_x2": 545.11505, "r_y2": 377.80435, "r_x3": 308.862, "r_y3": 377.80435, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 398.66588999999993, "r_x1": 545.11517, "r_y1": 398.66588999999993, "r_x2": 545.11517, "r_y2": 389.75934000000007, "r_x3": 308.862, "r_y3": 389.75934000000007, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 410.62088, "r_x1": 545.11523, "r_y1": 410.62088, "r_x2": 545.11523, "r_y2": 401.71432000000004, "r_x3": 308.862, "r_y3": 401.71432000000004, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 422.57687, "r_x1": 545.11517, "r_y1": 422.57687, "r_x2": 545.11517, "r_y2": 413.67032, "r_x3": 308.862, "r_y3": 413.67032, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 434.53186, "r_x1": 545.11505, "r_y1": 434.53186, "r_x2": 545.11505, "r_y2": 425.62531, "r_x3": 308.862, "r_y3": 425.62531, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 446.48685000000006, "r_x1": 437.9375, "r_y1": 446.48685000000006, "r_x2": 437.9375, "r_y2": 437.58029, "r_x3": 308.862, "r_y3": 437.58029, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required." }, { "label": "section_header", "id": 12, "page_no": 3, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 308.862, "t": 457.69427, "r": 420.16058, "b": 467.54633, "coord_origin": "TOPLEFT" }, "confidence": 0.937696099281311, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 467.54633, "r_x1": 323.14081, "r_y1": 467.54633, "r_x2": 323.14081, "r_y2": 457.69427, "r_x3": 308.862, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66003, "r_y0": 467.54633, "r_x1": 420.16058, "r_y1": 467.54633, "r_x2": 420.16058, "r_y2": 457.69427, "r_x3": 332.66003, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1. Model architecture." }, { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86197, "t": 476.76529, "r": 545.11572, "b": 664.99981, "coord_origin": "TOPLEFT" }, "confidence": 0.9878323078155518, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 485.67184, "r_x1": 545.11487, "r_y1": 485.67184, "r_x2": 545.11487, "r_y2": 476.76529, "r_x3": 320.81699, "r_y3": 476.76529, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.62683, "r_x1": 509.02054, "r_y1": 497.62683, "r_x2": 509.02054, "r_y2": 488.72028, "r_x3": 308.862, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.58588, "r_y0": 497.62683, "r_x1": 523.05786, "r_y1": 497.62683, "r_x2": 523.05786, "r_y2": 488.72028, "r_x3": 515.58588, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 497.62683, "r_x1": 545.11505, "r_y1": 497.62683, "r_x2": 545.11505, "r_y2": 488.72028, "r_x3": 529.62323, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 509.35269, "r_x1": 406.34601, "r_y1": 509.35269, "r_x2": 406.34601, "r_y2": 500.76492, "r_x3": 308.862, "r_y3": 500.76492, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87201, "r_y0": 509.58182, "r_x1": 545.1106, "r_y1": 509.58182, "r_x2": 545.1106, "r_y2": 500.67526, "r_x3": 408.87201, "r_y3": 500.67526, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 521.53781, "r_x1": 409.39459, "r_y1": 521.53781, "r_x2": 409.39459, "r_y2": 512.63126, "r_x3": 308.862, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.72705, "r_y0": 521.53781, "r_x1": 545.11505, "r_y1": 521.53781, "r_x2": 545.11505, "r_y2": 512.63126, "r_x3": 416.72705, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.4928, "r_x1": 436.194, "r_y1": 533.4928, "r_x2": 436.194, "r_y2": 524.58624, "r_x3": 308.862, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.526, "r_y0": 533.26367, "r_x1": 513.86694, "r_y1": 533.26367, "r_x2": 513.86694, "r_y2": 524.6759, "r_x3": 439.526, "r_y3": 524.6759, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43201, "r_y0": 533.4928, "r_x1": 545.10815, "r_y1": 533.4928, "r_x2": 545.10815, "r_y2": 524.58624, "r_x3": 517.43201, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.4478, "r_x1": 545.11511, "r_y1": 545.4478, "r_x2": 545.11511, "r_y2": 536.54124, "r_x3": 308.862, "r_y3": 536.54124, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.4028000000001, "r_x1": 358.5455, "r_y1": 557.4028000000001, "r_x2": 358.5455, "r_y2": 548.49625, "r_x3": 308.862, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19055, "r_y0": 557.4028000000001, "r_x1": 545.11517, "r_y1": 557.4028000000001, "r_x2": 545.11517, "r_y2": 548.49625, "r_x3": 365.19055, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.3578, "r_x1": 352.40851, "r_y1": 569.3578, "r_x2": 352.40851, "r_y2": 560.45125, "r_x3": 308.862, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.409, "r_y0": 569.13863, "r_x1": 360.1579, "r_y1": 569.13863, "r_x2": 360.1579, "r_y2": 560.29184, "r_x3": 352.409, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.15799, "r_y0": 569.3578, "r_x1": 367.90891, "r_y1": 569.3578, "r_x2": 367.90891, "r_y2": 560.45125, "r_x3": 360.15799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.909, "r_y0": 569.13863, "r_x1": 375.6579, "r_y1": 569.13863, "r_x2": 375.6579, "r_y2": 560.29184, "r_x3": 367.909, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.65799, "r_y0": 569.3578, "r_x1": 545.11182, "r_y1": 569.3578, "r_x2": 545.11182, "r_y2": 560.45125, "r_x3": 375.65799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.3138, "r_x1": 545.11499, "r_y1": 581.3138, "r_x2": 545.11499, "r_y2": 572.40724, "r_x3": 308.862, "r_y3": 572.40724, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.2688, "r_x1": 483.11768, "r_y1": 593.2688, "r_x2": 483.11768, "r_y2": 584.3622399999999, "r_x3": 308.862, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 593.04962, "r_x1": 490.86792, "r_y1": 593.04962, "r_x2": 490.86792, "r_y2": 584.20284, "r_x3": 483.11902, "r_y3": 584.20284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.86800999999997, "r_y0": 593.2688, "r_x1": 545.11438, "r_y1": 593.2688, "r_x2": 545.11438, "r_y2": 584.3622399999999, "r_x3": 490.86800999999997, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2238, "r_x1": 545.11493, "r_y1": 605.2238, "r_x2": 545.11493, "r_y2": 596.31725, "r_x3": 308.862, "r_y3": 596.31725, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.1788, "r_x1": 329.64395, "r_y1": 617.1788, "r_x2": 329.64395, "r_y2": 608.27225, "r_x3": 308.862, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.646, "r_y0": 616.9596300000001, "r_x1": 337.3949, "r_y1": 616.9596300000001, "r_x2": 337.3949, "r_y2": 608.11284, "r_x3": 329.646, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39398, "r_y0": 617.1788, "r_x1": 468.5914, "r_y1": 617.1788, "r_x2": 468.5914, "r_y2": 608.27225, "r_x3": 337.39398, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59496999999993, "r_y0": 616.9596300000001, "r_x1": 476.34387000000004, "r_y1": 616.9596300000001, "r_x2": 476.34387000000004, "r_y2": 608.11284, "r_x3": 468.59496999999993, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.3439599999999, "r_y0": 617.1788, "r_x1": 545.11572, "r_y1": 617.1788, "r_x2": 545.11572, "r_y2": 608.27225, "r_x3": 476.3439599999999, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.1338000000001, "r_x1": 545.11499, "r_y1": 629.1338000000001, "r_x2": 545.11499, "r_y2": 620.22725, "r_x3": 308.86197, "r_y3": 620.22725, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.08881, "r_x1": 545.11517, "r_y1": 641.08881, "r_x2": 545.11517, "r_y2": 632.1822500000001, "r_x3": 308.86197, "r_y3": 632.1822500000001, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.0448, "r_x1": 545.11511, "r_y1": 653.0448, "r_x2": 545.11511, "r_y2": 644.13824, "r_x3": 308.86197, "r_y3": 644.13824, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 664.99981, "r_x1": 449.42432, "r_y1": 664.99981, "r_x2": 449.42432, "r_y2": 656.09325, "r_x3": 308.86197, "r_y3": 656.09325, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification." }, { "label": "text", "id": 7, "page_no": 3, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.86197, "t": 668.2607, "r": 545.11511, "b": 713.1518169999999, "coord_origin": "TOPLEFT" }, "confidence": 0.978580117225647, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 677.21707, "r_x1": 431.90985, "r_y1": 677.21707, "r_x2": 431.90985, "r_y2": 668.2607, "r_x3": 320.81696, "r_y3": 668.2607, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.49896, "r_y0": 677.2868100000001, "r_x1": 545.11255, "r_y1": 677.2868100000001, "r_x2": 545.11255, "r_y2": 668.3802499999999, "r_x3": 439.49896, "r_y3": 668.3802499999999, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 689.24181, "r_x1": 545.11499, "r_y1": 689.24181, "r_x2": 545.11499, "r_y2": 680.33525, "r_x3": 308.86197, "r_y3": 680.33525, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 701.196815, "r_x1": 545.11511, "r_y1": 701.196815, "r_x2": 545.11511, "r_y2": 692.290253, "r_x3": 308.86197, "r_y3": 692.290253, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 713.1518169999999, "r_x1": 545.11505, "r_y1": 713.1518169999999, "r_x2": 545.11505, "r_y2": 704.245255, "r_x3": 308.86197, "r_y3": 704.245255, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-" }, { "label": "page_footer", "id": 14, "page_no": 3, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.12097, "t": 734.133251, "r": 300.10226, "b": 743.039814, "coord_origin": "TOPLEFT" }, "confidence": 0.8565718531608582, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12097, "r_y0": 743.039814, "r_x1": 300.10226, "r_y1": 743.039814, "r_x2": 300.10226, "r_y2": 734.133251, "r_x3": 295.12097, "r_y3": 734.133251, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" } ], "body": [ { "label": "text", "id": 10, "page_no": 3, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36511, "b": 96.06994999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9611433148384094, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36511, "r_y1": 84.11492999999996, "r_x2": 286.36511, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 212.28319, "r_y1": 96.06994999999995, "r_x2": 212.28319, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)." }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 100.96038999999996, "r": 286.36514, "b": 313.10507, "coord_origin": "TOPLEFT" }, "confidence": 0.988013744354248, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 109.86694, "r_x1": 286.36502, "r_y1": 109.86694, "r_x2": 286.36502, "r_y2": 100.96038999999996, "r_x3": 62.067001, "r_y3": 100.96038999999996, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 121.82195999999999, "r_x1": 286.36508, "r_y1": 121.82195999999999, "r_x2": 286.36508, "r_y2": 112.91540999999995, "r_x3": 50.112, "r_y3": 112.91540999999995, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 133.77697999999998, "r_x1": 286.36508, "r_y1": 133.77697999999998, "r_x2": 286.36508, "r_y2": 124.87041999999997, "r_x3": 50.112, "r_y3": 124.87041999999997, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 145.73297000000002, "r_x1": 286.36511, "r_y1": 145.73297000000002, "r_x2": 286.36511, "r_y2": 136.82641999999998, "r_x3": 50.112, "r_y3": 136.82641999999998, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 157.68799, "r_x1": 286.36511, "r_y1": 157.68799, "r_x2": 286.36511, "r_y2": 148.78143, "r_x3": 50.112, "r_y3": 148.78143, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 169.64301, "r_x1": 286.36508, "r_y1": 169.64301, "r_x2": 286.36508, "r_y2": 160.73645, "r_x3": 50.112, "r_y3": 160.73645, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 181.59802000000002, "r_x1": 286.36505, "r_y1": 181.59802000000002, "r_x2": 286.36505, "r_y2": 172.69146999999998, "r_x3": 50.112, "r_y3": 172.69146999999998, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 193.55304, "r_x1": 286.36508, "r_y1": 193.55304, "r_x2": 286.36508, "r_y2": 184.64648, "r_x3": 50.112, "r_y3": 184.64648, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 205.50903000000005, "r_x1": 286.36508, "r_y1": 205.50903000000005, "r_x2": 286.36508, "r_y2": 196.60248, "r_x3": 50.112, "r_y3": 196.60248, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 217.46405000000004, "r_x1": 286.36508, "r_y1": 217.46405000000004, "r_x2": 286.36508, "r_y2": 208.5575, "r_x3": 50.112, "r_y3": 208.5575, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 229.41907000000003, "r_x1": 286.36511, "r_y1": 229.41907000000003, "r_x2": 286.36511, "r_y2": 220.51251000000002, "r_x3": 50.112, "r_y3": 220.51251000000002, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 241.37408000000005, "r_x1": 286.36508, "r_y1": 241.37408000000005, "r_x2": 286.36508, "r_y2": 232.46753, "r_x3": 50.112, "r_y3": 232.46753, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 253.32910000000004, "r_x1": 286.36508, "r_y1": 253.32910000000004, "r_x2": 286.36508, "r_y2": 244.42255, "r_x3": 50.112, "r_y3": 244.42255, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 265.28412000000003, "r_x1": 286.36505, "r_y1": 265.28412000000003, "r_x2": 286.36505, "r_y2": 256.37756, "r_x3": 50.112, "r_y3": 256.37756, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 277.24010999999996, "r_x1": 286.36505, "r_y1": 277.24010999999996, "r_x2": 286.36505, "r_y2": 268.33356000000003, "r_x3": 50.112, "r_y3": 268.33356000000003, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 289.1951, "r_x1": 68.652397, "r_y1": 289.1951, "r_x2": 68.652397, "r_y2": 280.28853999999995, "r_x3": 50.112, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.566444, "r_y0": 289.1951, "r_x1": 286.36514, "r_y1": 289.1951, "r_x2": 286.36514, "r_y2": 280.28853999999995, "r_x3": 75.566444, "r_y3": 280.28853999999995, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 301.15009, "r_x1": 286.36511, "r_y1": 301.15009, "r_x2": 286.36511, "r_y2": 292.24353, "r_x3": 50.112, "r_y3": 292.24353, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 313.10507, "r_x1": 75.695961, "r_y1": 313.10507, "r_x2": 75.695961, "r_y2": 304.19852000000003, "r_x3": 50.112, "r_y3": 304.19852000000003, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 317.99550999999997, "r": 286.36511, "b": 434.49896, "coord_origin": "TOPLEFT" }, "confidence": 0.9873981475830078, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 326.90207, "r_x1": 286.36499, "r_y1": 326.90207, "r_x2": 286.36499, "r_y2": 317.99550999999997, "r_x3": 62.067001, "r_y3": 317.99550999999997, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 338.8580600000001, "r_x1": 286.36511, "r_y1": 338.8580600000001, "r_x2": 286.36511, "r_y2": 329.95151, "r_x3": 50.112, "r_y3": 329.95151, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 350.81305, "r_x1": 286.36502, "r_y1": 350.81305, "r_x2": 286.36502, "r_y2": 341.90649, "r_x3": 50.112, "r_y3": 341.90649, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 362.76804, "r_x1": 286.36505, "r_y1": 362.76804, "r_x2": 286.36505, "r_y2": 353.8614799999999, "r_x3": 50.112, "r_y3": 353.8614799999999, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 374.72301999999996, "r_x1": 286.36508, "r_y1": 374.72301999999996, "r_x2": 286.36508, "r_y2": 365.81647, "r_x3": 50.112, "r_y3": 365.81647, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 386.67801, "r_x1": 141.58859, "r_y1": 386.67801, "r_x2": 141.58859, "r_y2": 377.77145, "r_x3": 50.112, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.70189, "r_y0": 386.67801, "r_x1": 286.36508, "r_y1": 386.67801, "r_x2": 286.36508, "r_y2": 377.77145, "r_x3": 148.70189, "r_y3": 377.77145, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 398.63300000000004, "r_x1": 286.36508, "r_y1": 398.63300000000004, "r_x2": 286.36508, "r_y2": 389.72644, "r_x3": 50.112, "r_y3": 389.72644, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 410.58899, "r_x1": 286.36511, "r_y1": 410.58899, "r_x2": 286.36511, "r_y2": 401.68243, "r_x3": 50.112, "r_y3": 401.68243, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 422.54398, "r_x1": 286.36511, "r_y1": 422.54398, "r_x2": 286.36511, "r_y2": 413.63742, "r_x3": 50.112, "r_y3": 413.63742, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 434.49896, "r_x1": 216.39774, "r_y1": 434.49896, "r_x2": 216.39774, "r_y2": 425.59241, "r_x3": 50.112, "r_y3": 425.59241, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data." }, { "label": "text", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.112, "t": 439.3894, "r": 286.36655, "b": 627.62389, "coord_origin": "TOPLEFT" }, "confidence": 0.9876030087471008, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 448.2959599999999, "r_x1": 286.36499, "r_y1": 448.2959599999999, "r_x2": 286.36499, "r_y2": 439.3894, "r_x3": 62.067001, "r_y3": 439.3894, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 460.25095, "r_x1": 172.14388, "r_y1": 460.25095, "r_x2": 172.14388, "r_y2": 451.34439, "r_x3": 50.112, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.14801, "r_y0": 460.02182, "r_x1": 224.70818999999997, "r_y1": 460.02182, "r_x2": 224.70818999999997, "r_y2": 451.43405, "r_x3": 174.14801, "r_y3": 451.43405, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.70801, "r_y0": 460.25095, "r_x1": 286.36655, "r_y1": 460.25095, "r_x2": 286.36655, "r_y2": 451.34439, "r_x3": 224.70801, "r_y3": 451.34439, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 472.20694, "r_x1": 286.36505, "r_y1": 472.20694, "r_x2": 286.36505, "r_y2": 463.30038, "r_x3": 50.112015, "r_y3": 463.30038, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 484.16193, "r_x1": 286.36511, "r_y1": 484.16193, "r_x2": 286.36511, "r_y2": 475.25537, "r_x3": 50.112015, "r_y3": 475.25537, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 496.11691, "r_x1": 286.36511, "r_y1": 496.11691, "r_x2": 286.36511, "r_y2": 487.21036, "r_x3": 50.112015, "r_y3": 487.21036, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 508.0719, "r_x1": 286.36508, "r_y1": 508.0719, "r_x2": 286.36508, "r_y2": 499.16534, "r_x3": 50.112015, "r_y3": 499.16534, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 520.02689, "r_x1": 286.36505, "r_y1": 520.02689, "r_x2": 286.36505, "r_y2": 511.12033, "r_x3": 50.112015, "r_y3": 511.12033, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 531.98288, "r_x1": 286.36508, "r_y1": 531.98288, "r_x2": 286.36508, "r_y2": 523.07632, "r_x3": 50.112015, "r_y3": 523.07632, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 543.93788, "r_x1": 286.36508, "r_y1": 543.93788, "r_x2": 286.36508, "r_y2": 535.0313100000001, "r_x3": 50.112015, "r_y3": 535.0313100000001, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 555.89288, "r_x1": 286.36511, "r_y1": 555.89288, "r_x2": 286.36511, "r_y2": 546.98633, "r_x3": 50.112015, "r_y3": 546.98633, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 567.84789, "r_x1": 286.36508, "r_y1": 567.84789, "r_x2": 286.36508, "r_y2": 558.94133, "r_x3": 50.112015, "r_y3": 558.94133, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 579.8028899999999, "r_x1": 286.36511, "r_y1": 579.8028899999999, "r_x2": 286.36511, "r_y2": 570.89633, "r_x3": 50.112015, "r_y3": 570.89633, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 591.75789, "r_x1": 286.36511, "r_y1": 591.75789, "r_x2": 286.36511, "r_y2": 582.85133, "r_x3": 50.112015, "r_y3": 582.85133, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 603.71388, "r_x1": 286.36505, "r_y1": 603.71388, "r_x2": 286.36505, "r_y2": 594.80733, "r_x3": 50.112015, "r_y3": 594.80733, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 615.6688800000001, "r_x1": 286.36508, "r_y1": 615.6688800000001, "r_x2": 286.36508, "r_y2": 606.76233, "r_x3": 50.112015, "r_y3": 606.76233, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 627.62389, "r_x1": 209.7527, "r_y1": 627.62389, "r_x2": 209.7527, "r_y2": 618.71733, "r_x3": 50.112015, "r_y3": 618.71733, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain." }, { "label": "text", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.112015, "t": 632.51433, "r": 286.36511, "b": 713.151894, "coord_origin": "TOPLEFT" }, "confidence": 0.9871614575386047, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067017, "r_y0": 641.42088, "r_x1": 286.36499, "r_y1": 641.42088, "r_x2": 286.36499, "r_y2": 632.51433, "r_x3": 62.067017, "r_y3": 632.51433, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 653.37589, "r_x1": 286.36508, "r_y1": 653.37589, "r_x2": 286.36508, "r_y2": 644.46933, "r_x3": 50.112015, "r_y3": 644.46933, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.33189, "r_x1": 286.36511, "r_y1": 665.33189, "r_x2": 286.36511, "r_y2": 656.42532, "r_x3": 50.112015, "r_y3": 656.42532, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28689, "r_x1": 286.36505, "r_y1": 677.28689, "r_x2": 286.36505, "r_y2": 668.38033, "r_x3": 50.112015, "r_y3": 668.38033, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24189, "r_x1": 286.36508, "r_y1": 689.24189, "r_x2": 286.36508, "r_y2": 680.33533, "r_x3": 50.112015, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.196892, "r_x1": 286.36508, "r_y1": 701.196892, "r_x2": 286.36508, "r_y2": 692.290329, "r_x3": 50.112015, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151894, "r_x1": 286.36511, "r_y1": 713.151894, "r_x2": 286.36511, "r_y2": 704.245331, "r_x3": 50.112015, "r_y3": 704.245331, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third" }, { "label": "table", "id": 8, "page_no": 3, "cluster": { "id": 8, "label": "table", "bbox": { "l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT" }, "confidence": 0.9777463674545288, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.332, "t": 73.61437999999998, "r": 430.90231, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.332, "r_y0": 82.52094, "r_x1": 430.90231, "r_y1": 82.52094, "r_x2": 430.90231, "r_y2": 73.61437999999998, "r_x3": 412.332, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.85742, "t": 73.61437999999998, "r": 464.4463799999999, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.85742, "r_y0": 82.52094, "r_x1": 464.4463799999999, "r_y1": 82.52094, "r_x2": 464.4463799999999, "r_y2": 73.61437999999998, "r_x3": 442.85742, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.78632, "t": 73.61437999999998, "r": 494.94193, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.78632, "r_y0": 82.52094, "r_x1": 494.94193, "r_y1": 82.52094, "r_x2": 494.94193, "r_y2": 73.61437999999998, "r_x3": 477.78632, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28186, "t": 73.61437999999998, "r": 536.91437, "b": 82.52094, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28186, "r_y0": 82.52094, "r_x1": 536.91437, "r_y1": 82.52094, "r_x2": 536.91437, "r_y2": 73.61437999999998, "r_x3": 508.28186, "r_y3": 73.61437999999998, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.9673499999999, "r": 361.64264, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87390000000005, "r_x1": 361.64264, "r_y1": 94.87390000000005, "r_x2": 361.64264, "r_y2": 85.9673499999999, "r_x3": 317.06, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.85599, "t": 85.6684600000001, "r": 425.37775, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 94.88385000000017, "r_x1": 425.37775, "r_y1": 94.88385000000017, "r_x2": 425.37775, "r_y2": 85.6684600000001, "r_x3": 417.85599, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.89569, "t": 85.6684600000001, "r": 457.41745000000003, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 94.88385000000017, "r_x1": 457.41745000000003, "r_y1": 94.88385000000017, "r_x2": 457.41745000000003, "r_y2": 85.6684600000001, "r_x3": 449.89569, "r_y3": 85.6684600000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.401, "t": 85.9673499999999, "r": 496.3262, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 94.87390000000005, "r_x1": 496.3262, "r_y1": 94.87390000000005, "r_x2": 496.3262, "r_y2": 85.9673499999999, "r_x3": 476.401, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63495, "t": 85.9673499999999, "r": 532.56012, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 94.87390000000005, "r_x1": 532.56012, "r_y1": 94.87390000000005, "r_x2": 532.56012, "r_y2": 85.9673499999999, "r_x3": 512.63495, "r_y3": 85.9673499999999, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92236000000003, "r": 359.43094, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.82892000000004, "r_x1": 359.43094, "r_y1": 106.82892000000004, "r_x2": 359.43094, "r_y2": 97.92236000000003, "r_x3": 317.06, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.85599, "t": 97.62347, "r": 425.37775, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 106.83887000000016, "r_x1": 425.37775, "r_y1": 106.83887000000016, "r_x2": 425.37775, "r_y2": 97.62347, "r_x3": 417.85599, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.89569, "t": 97.62347, "r": 457.41745000000003, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 106.83887000000016, "r_x1": 457.41745000000003, "r_y1": 106.83887000000016, "r_x2": 457.41745000000003, "r_y2": 97.62347, "r_x3": 449.89569, "r_y3": 97.62347, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.401, "t": 97.92236000000003, "r": 496.3262, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 106.82892000000004, "r_x1": 496.3262, "r_y1": 106.82892000000004, "r_x2": 496.3262, "r_y2": 97.92236000000003, "r_x3": 476.401, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46185, "t": 97.92236000000003, "r": 531.73328, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46185, "r_y0": 106.82892000000004, "r_x1": 531.73328, "r_y1": 106.82892000000004, "r_x2": 531.73328, "r_y2": 97.92236000000003, "r_x3": 513.46185, "r_y3": 97.92236000000003, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.87836000000004, "r": 359.97888, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78490999999997, "r_x1": 359.97888, "r_y1": 118.78490999999997, "r_x2": 359.97888, "r_y2": 109.87836000000004, "r_x3": 317.06, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.85599, "t": 109.57947000000001, "r": 425.37775, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 118.79485999999997, "r_x1": 425.37775, "r_y1": 118.79485999999997, "r_x2": 425.37775, "r_y2": 109.57947000000001, "r_x3": 417.85599, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81226, "t": 109.57947000000001, "r": 456.50091999999995, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81226, "r_y0": 118.79485999999997, "r_x1": 456.50091999999995, "r_y1": 118.79485999999997, "r_x2": 456.50091999999995, "r_y2": 109.57947000000001, "r_x3": 450.81226, "r_y3": 109.57947000000001, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.401, "t": 109.87836000000004, "r": 496.3262, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 118.78490999999997, "r_x1": 496.3262, "r_y1": 118.78490999999997, "r_x2": 496.3262, "r_y2": 109.87836000000004, "r_x3": 476.401, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25017999999994, "t": 109.87836000000004, "r": 533.94501, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25017999999994, "r_y0": 118.78490999999997, "r_x1": 533.94501, "r_y1": 118.78490999999997, "r_x2": 533.94501, "r_y2": 109.87836000000004, "r_x3": 511.25017999999994, "r_y3": 109.87836000000004, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83336999999995, "r": 400.37723, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.73992999999996, "r_x1": 400.37723, "r_y1": 130.73992999999996, "r_x2": 400.37723, "r_y2": 121.83336999999995, "r_x3": 317.06, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.85599, "t": 121.53448000000003, "r": 425.37775, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 130.74987999999996, "r_x1": 425.37775, "r_y1": 130.74987999999996, "r_x2": 425.37775, "r_y2": 121.53448000000003, "r_x3": 417.85599, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.89569, "t": 121.53448000000003, "r": 457.41745000000003, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 130.74987999999996, "r_x1": 457.41745000000003, "r_y1": 130.74987999999996, "r_x2": 457.41745000000003, "r_y2": 121.53448000000003, "r_x3": 449.89569, "r_y3": 121.53448000000003, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.401, "t": 121.83336999999995, "r": 496.3262, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 130.73992999999996, "r_x1": 496.3262, "r_y1": 130.73992999999996, "r_x2": 496.3262, "r_y2": 121.83336999999995, "r_x3": 476.401, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63495, "t": 121.83336999999995, "r": 532.56012, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 130.73992999999996, "r_x1": 532.56012, "r_y1": 130.73992999999996, "r_x2": 532.56012, "r_y2": 121.83336999999995, "r_x3": 512.63495, "r_y3": 121.83336999999995, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.78839000000005, "r": 375.17184, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69494999999995, "r_x1": 375.17184, "r_y1": 142.69494999999995, "r_x2": 375.17184, "r_y2": 133.78839000000005, "r_x3": 317.06, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.85599, "t": 133.48950000000002, "r": 425.37775, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 142.70489999999995, "r_x1": 425.37775, "r_y1": 142.70489999999995, "r_x2": 425.37775, "r_y2": 133.48950000000002, "r_x3": 417.85599, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.89569, "t": 133.48950000000002, "r": 457.41745000000003, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 142.70489999999995, "r_x1": 457.41745000000003, "r_y1": 142.70489999999995, "r_x2": 457.41745000000003, "r_y2": 133.48950000000002, "r_x3": 449.89569, "r_y3": 133.48950000000002, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.401, "t": 133.78839000000005, "r": 496.3262, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 142.69494999999995, "r_x1": 496.3262, "r_y1": 142.69494999999995, "r_x2": 496.3262, "r_y2": 133.78839000000005, "r_x3": 476.401, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63495, "t": 133.78839000000005, "r": 532.56012, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 142.69494999999995, "r_x1": 532.56012, "r_y1": 142.69494999999995, "r_x2": 532.56012, "r_y2": 133.78839000000005, "r_x3": 512.63495, "r_y3": 133.78839000000005, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74341000000004, "r": 369.39352, "b": 154.64995999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.64995999999996, "r_x1": 369.39352, "r_y1": 154.64995999999996, "r_x2": 369.39352, "r_y2": 145.74341000000004, "r_x3": 317.06, "r_y3": 145.74341000000004, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.85599, "t": 145.44446000000005, "r": 425.37775, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.85599, "r_y0": 154.65985, "r_x1": 425.37775, "r_y1": 154.65985, "r_x2": 425.37775, "r_y2": 145.44446000000005, "r_x3": 417.85599, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.89569, "t": 145.44446000000005, "r": 457.41745000000003, "b": 154.65985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.89569, "r_y0": 154.65985, "r_x1": 457.41745000000003, "r_y1": 154.65985, "r_x2": 457.41745000000003, "r_y2": 145.44446000000005, "r_x3": 449.89569, "r_y3": 145.44446000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.401, "t": 145.74334999999996, "r": 496.3262, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.401, "r_y0": 154.6499, "r_x1": 496.3262, "r_y1": 154.6499, "r_x2": 496.3262, "r_y2": 145.74334999999996, "r_x3": 476.401, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63495, "t": 145.74334999999996, "r": 532.56012, "b": 154.6499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63495, "r_y0": 154.6499, "r_x1": 532.56012, "r_y1": 154.6499, "r_x2": 532.56012, "r_y2": 145.74334999999996, "r_x3": 512.63495, "r_y3": 145.74334999999996, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 412.332, "t": 73.61437999999998, "r": 430.90231, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 442.85742, "t": 73.61437999999998, "r": 464.4463799999999, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 477.78632, "t": 73.61437999999998, "r": 494.94193, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 508.28186, "t": 73.61437999999998, "r": 536.91437, "b": 82.52094, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 85.9673499999999, "r": 361.64264, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 85.6684600000001, "r": 425.37775, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 85.6684600000001, "r": 457.41745000000003, "b": 94.88385000000017, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 85.9673499999999, "r": 496.3262, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 85.9673499999999, "r": 532.56012, "b": 94.87390000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 97.92236000000003, "r": 359.43094, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 97.62347, "r": 425.37775, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 97.62347, "r": 457.41745000000003, "b": 106.83887000000016, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 97.92236000000003, "r": 496.3262, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.46185, "t": 97.92236000000003, "r": 531.73328, "b": 106.82892000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 109.87836000000004, "r": 359.97888, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 109.57947000000001, "r": 425.37775, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 450.81226, "t": 109.57947000000001, "r": 456.50091999999995, "b": 118.79485999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 109.87836000000004, "r": 496.3262, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 511.25017999999994, "t": 109.87836000000004, "r": 533.94501, "b": 118.78490999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 121.83336999999995, "r": 400.37723, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 121.53448000000003, "r": 425.37775, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 121.53448000000003, "r": 457.41745000000003, "b": 130.74987999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 121.83336999999995, "r": 496.3262, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 121.83336999999995, "r": 532.56012, "b": 130.73992999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 133.78839000000005, "r": 375.17184, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 133.48950000000002, "r": 425.37775, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 133.48950000000002, "r": 457.41745000000003, "b": 142.70489999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 133.78839000000005, "r": 496.3262, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 133.78839000000005, "r": 532.56012, "b": 142.69494999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 145.74341000000004, "r": 369.39352, "b": 154.64995999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.85599, "t": 145.44446000000005, "r": 425.37775, "b": 154.65985, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.89569, "t": 145.44446000000005, "r": 457.41745000000003, "b": 154.65985, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.401, "t": 145.74334999999996, "r": 496.3262, "b": 154.6499, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63495, "t": 145.74334999999996, "r": 532.56012, "b": 154.6499, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 9, "page_no": 3, "cluster": { "id": 9, "label": "caption", "bbox": { "l": 308.862, "t": 167.66138, "r": 545.11505, "b": 224.38897999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9667726755142212, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 176.56793000000005, "r_x1": 344.6178, "r_y1": 176.56793000000005, "r_x2": 344.6178, "r_y2": 167.66138, "r_x3": 308.862, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.07602, "r_y0": 176.56793000000005, "r_x1": 380.45328, "r_y1": 176.56793000000005, "r_x2": 380.45328, "r_y2": 167.66138, "r_x3": 361.07602, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.56799, "r_y0": 176.33880999999997, "r_x1": 468.67974999999996, "r_y1": 176.33880999999997, "r_x2": 468.67974999999996, "r_y2": 167.75104, "r_x3": 386.56799, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.79599, "r_y0": 176.56793000000005, "r_x1": 489.18198, "r_y1": 176.56793000000005, "r_x2": 489.18198, "r_y2": 167.66138, "r_x3": 474.79599, "r_y3": 167.66138, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.29898000000003, "r_y0": 176.33880999999997, "r_x1": 545.112, "r_y1": 176.33880999999997, "r_x2": 545.112, "r_y2": 167.75104, "r_x3": 495.29898000000003, "r_y3": 167.75104, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 188.29381999999998, "r_x1": 341.16077, "r_y1": 188.29381999999998, "r_x2": 341.16077, "r_y2": 179.70605, "r_x3": 308.862, "r_y3": 179.70605, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.457, "r_y0": 188.52295000000004, "r_x1": 545.11005, "r_y1": 188.52295000000004, "r_x2": 545.11005, "r_y2": 179.61639000000002, "r_x3": 343.457, "r_y3": 179.61639000000002, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 200.47797000000003, "r_x1": 545.11505, "r_y1": 200.47797000000003, "r_x2": 545.11505, "r_y2": 191.57141000000001, "r_x3": 308.862, "r_y3": 191.57141000000001, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 212.43298000000004, "r_x1": 545.11499, "r_y1": 212.43298000000004, "r_x2": 545.11499, "r_y2": 203.52643, "r_x3": 308.862, "r_y3": 203.52643, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 224.38897999999995, "r_x1": 523.93469, "r_y1": 224.38897999999995, "r_x2": 523.93469, "r_y2": 215.48242000000005, "r_x3": 308.862, "r_y3": 215.48242000000005, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank." }, { "label": "text", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "text", "bbox": { "l": 308.862, "t": 249.62041999999997, "r": 545.11517, "b": 294.39197, "coord_origin": "TOPLEFT" }, "confidence": 0.978954017162323, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.52698, "r_x1": 545.11517, "r_y1": 258.52698, "r_x2": 545.11517, "r_y2": 249.62041999999997, "r_x3": 308.862, "r_y3": 249.62041999999997, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.48199, "r_x1": 545.11517, "r_y1": 270.48199, "r_x2": 545.11517, "r_y2": 261.57543999999996, "r_x3": 308.862, "r_y3": 261.57543999999996, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.43698, "r_x1": 545.11505, "r_y1": 282.43698, "r_x2": 545.11505, "r_y2": 273.5304, "r_x3": 308.862, "r_y3": 273.5304, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.39197, "r_x1": 436.82169, "r_y1": 294.39197, "r_x2": 436.82169, "r_y2": 285.48541000000006, "r_x3": 308.862, "r_y3": 285.48541000000006, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples." }, { "label": "text", "id": 13, "page_no": 3, "cluster": { "id": 13, "label": "text", "bbox": { "l": 320.81699, "t": 297.77240000000006, "r": 542.74396, "b": 306.67896, "coord_origin": "TOPLEFT" }, "confidence": 0.9043695330619812, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 306.67896, "r_x1": 542.74396, "r_y1": 306.67896, "r_x2": 542.74396, "r_y2": 297.77240000000006, "r_x3": 320.81699, "r_y3": 297.77240000000006, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tab. 1 summarizes the various attributes of the datasets." }, { "label": "section_header", "id": 11, "page_no": 3, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 308.862, "t": 321.18396, "r": 444.93607000000003, "b": 331.93167000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9466595649719238, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 331.93167000000005, "r_x1": 316.28476, "r_y1": 331.93167000000005, "r_x2": 316.28476, "r_y2": 321.18396, "r_x3": 308.862, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18176, "r_y0": 331.93167000000005, "r_x1": 444.93607000000003, "r_y1": 331.93167000000005, "r_x2": 444.93607000000003, "r_y2": 321.18396, "r_x3": 326.18176, "r_y3": 321.18396, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. The TableFormer model" }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 341.93939, "r": 545.11523, "b": 446.48685000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.9884450435638428, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 350.84594999999996, "r_x1": 545.11499, "r_y1": 350.84594999999996, "r_x2": 545.11499, "r_y2": 341.93939, "r_x3": 320.81699, "r_y3": 341.93939, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 362.80092999999994, "r_x1": 545.11511, "r_y1": 362.80092999999994, "r_x2": 545.11511, "r_y2": 353.89438, "r_x3": 308.862, "r_y3": 353.89438, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 374.75592, "r_x1": 545.11517, "r_y1": 374.75592, "r_x2": 545.11517, "r_y2": 365.84937, "r_x3": 308.862, "r_y3": 365.84937, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 386.71091, "r_x1": 545.11505, "r_y1": 386.71091, "r_x2": 545.11505, "r_y2": 377.80435, "r_x3": 308.862, "r_y3": 377.80435, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 398.66588999999993, "r_x1": 545.11517, "r_y1": 398.66588999999993, "r_x2": 545.11517, "r_y2": 389.75934000000007, "r_x3": 308.862, "r_y3": 389.75934000000007, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 410.62088, "r_x1": 545.11523, "r_y1": 410.62088, "r_x2": 545.11523, "r_y2": 401.71432000000004, "r_x3": 308.862, "r_y3": 401.71432000000004, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 422.57687, "r_x1": 545.11517, "r_y1": 422.57687, "r_x2": 545.11517, "r_y2": 413.67032, "r_x3": 308.862, "r_y3": 413.67032, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 434.53186, "r_x1": 545.11505, "r_y1": 434.53186, "r_x2": 545.11505, "r_y2": 425.62531, "r_x3": 308.862, "r_y3": 425.62531, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 446.48685000000006, "r_x1": 437.9375, "r_y1": 446.48685000000006, "r_x2": 437.9375, "r_y2": 437.58029, "r_x3": 308.862, "r_y3": 437.58029, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required." }, { "label": "section_header", "id": 12, "page_no": 3, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 308.862, "t": 457.69427, "r": 420.16058, "b": 467.54633, "coord_origin": "TOPLEFT" }, "confidence": 0.937696099281311, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 467.54633, "r_x1": 323.14081, "r_y1": 467.54633, "r_x2": 323.14081, "r_y2": 457.69427, "r_x3": 308.862, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66003, "r_y0": 467.54633, "r_x1": 420.16058, "r_y1": 467.54633, "r_x2": 420.16058, "r_y2": 457.69427, "r_x3": 332.66003, "r_y3": 457.69427, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1. Model architecture." }, { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86197, "t": 476.76529, "r": 545.11572, "b": 664.99981, "coord_origin": "TOPLEFT" }, "confidence": 0.9878323078155518, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 485.67184, "r_x1": 545.11487, "r_y1": 485.67184, "r_x2": 545.11487, "r_y2": 476.76529, "r_x3": 320.81699, "r_y3": 476.76529, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.62683, "r_x1": 509.02054, "r_y1": 497.62683, "r_x2": 509.02054, "r_y2": 488.72028, "r_x3": 308.862, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.58588, "r_y0": 497.62683, "r_x1": 523.05786, "r_y1": 497.62683, "r_x2": 523.05786, "r_y2": 488.72028, "r_x3": 515.58588, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62323, "r_y0": 497.62683, "r_x1": 545.11505, "r_y1": 497.62683, "r_x2": 545.11505, "r_y2": 488.72028, "r_x3": 529.62323, "r_y3": 488.72028, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 509.35269, "r_x1": 406.34601, "r_y1": 509.35269, "r_x2": 406.34601, "r_y2": 500.76492, "r_x3": 308.862, "r_y3": 500.76492, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87201, "r_y0": 509.58182, "r_x1": 545.1106, "r_y1": 509.58182, "r_x2": 545.1106, "r_y2": 500.67526, "r_x3": 408.87201, "r_y3": 500.67526, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 521.53781, "r_x1": 409.39459, "r_y1": 521.53781, "r_x2": 409.39459, "r_y2": 512.63126, "r_x3": 308.862, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.72705, "r_y0": 521.53781, "r_x1": 545.11505, "r_y1": 521.53781, "r_x2": 545.11505, "r_y2": 512.63126, "r_x3": 416.72705, "r_y3": 512.63126, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.4928, "r_x1": 436.194, "r_y1": 533.4928, "r_x2": 436.194, "r_y2": 524.58624, "r_x3": 308.862, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.526, "r_y0": 533.26367, "r_x1": 513.86694, "r_y1": 533.26367, "r_x2": 513.86694, "r_y2": 524.6759, "r_x3": 439.526, "r_y3": 524.6759, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43201, "r_y0": 533.4928, "r_x1": 545.10815, "r_y1": 533.4928, "r_x2": 545.10815, "r_y2": 524.58624, "r_x3": 517.43201, "r_y3": 524.58624, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.4478, "r_x1": 545.11511, "r_y1": 545.4478, "r_x2": 545.11511, "r_y2": 536.54124, "r_x3": 308.862, "r_y3": 536.54124, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.4028000000001, "r_x1": 358.5455, "r_y1": 557.4028000000001, "r_x2": 358.5455, "r_y2": 548.49625, "r_x3": 308.862, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19055, "r_y0": 557.4028000000001, "r_x1": 545.11517, "r_y1": 557.4028000000001, "r_x2": 545.11517, "r_y2": 548.49625, "r_x3": 365.19055, "r_y3": 548.49625, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.3578, "r_x1": 352.40851, "r_y1": 569.3578, "r_x2": 352.40851, "r_y2": 560.45125, "r_x3": 308.862, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.409, "r_y0": 569.13863, "r_x1": 360.1579, "r_y1": 569.13863, "r_x2": 360.1579, "r_y2": 560.29184, "r_x3": 352.409, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.15799, "r_y0": 569.3578, "r_x1": 367.90891, "r_y1": 569.3578, "r_x2": 367.90891, "r_y2": 560.45125, "r_x3": 360.15799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.909, "r_y0": 569.13863, "r_x1": 375.6579, "r_y1": 569.13863, "r_x2": 375.6579, "r_y2": 560.29184, "r_x3": 367.909, "r_y3": 560.29184, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.65799, "r_y0": 569.3578, "r_x1": 545.11182, "r_y1": 569.3578, "r_x2": 545.11182, "r_y2": 560.45125, "r_x3": 375.65799, "r_y3": 560.45125, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.3138, "r_x1": 545.11499, "r_y1": 581.3138, "r_x2": 545.11499, "r_y2": 572.40724, "r_x3": 308.862, "r_y3": 572.40724, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.2688, "r_x1": 483.11768, "r_y1": 593.2688, "r_x2": 483.11768, "r_y2": 584.3622399999999, "r_x3": 308.862, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 593.04962, "r_x1": 490.86792, "r_y1": 593.04962, "r_x2": 490.86792, "r_y2": 584.20284, "r_x3": 483.11902, "r_y3": 584.20284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.86800999999997, "r_y0": 593.2688, "r_x1": 545.11438, "r_y1": 593.2688, "r_x2": 545.11438, "r_y2": 584.3622399999999, "r_x3": 490.86800999999997, "r_y3": 584.3622399999999, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.2238, "r_x1": 545.11493, "r_y1": 605.2238, "r_x2": 545.11493, "r_y2": 596.31725, "r_x3": 308.862, "r_y3": 596.31725, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.1788, "r_x1": 329.64395, "r_y1": 617.1788, "r_x2": 329.64395, "r_y2": 608.27225, "r_x3": 308.862, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.646, "r_y0": 616.9596300000001, "r_x1": 337.3949, "r_y1": 616.9596300000001, "r_x2": 337.3949, "r_y2": 608.11284, "r_x3": 329.646, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39398, "r_y0": 617.1788, "r_x1": 468.5914, "r_y1": 617.1788, "r_x2": 468.5914, "r_y2": 608.27225, "r_x3": 337.39398, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59496999999993, "r_y0": 616.9596300000001, "r_x1": 476.34387000000004, "r_y1": 616.9596300000001, "r_x2": 476.34387000000004, "r_y2": 608.11284, "r_x3": 468.59496999999993, "r_y3": 608.11284, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.3439599999999, "r_y0": 617.1788, "r_x1": 545.11572, "r_y1": 617.1788, "r_x2": 545.11572, "r_y2": 608.27225, "r_x3": 476.3439599999999, "r_y3": 608.27225, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 629.1338000000001, "r_x1": 545.11499, "r_y1": 629.1338000000001, "r_x2": 545.11499, "r_y2": 620.22725, "r_x3": 308.86197, "r_y3": 620.22725, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 641.08881, "r_x1": 545.11517, "r_y1": 641.08881, "r_x2": 545.11517, "r_y2": 632.1822500000001, "r_x3": 308.86197, "r_y3": 632.1822500000001, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 653.0448, "r_x1": 545.11511, "r_y1": 653.0448, "r_x2": 545.11511, "r_y2": 644.13824, "r_x3": 308.86197, "r_y3": 644.13824, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 664.99981, "r_x1": 449.42432, "r_y1": 664.99981, "r_x2": 449.42432, "r_y2": 656.09325, "r_x3": 308.86197, "r_y3": 656.09325, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification." }, { "label": "text", "id": 7, "page_no": 3, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.86197, "t": 668.2607, "r": 545.11511, "b": 713.1518169999999, "coord_origin": "TOPLEFT" }, "confidence": 0.978580117225647, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 677.21707, "r_x1": 431.90985, "r_y1": 677.21707, "r_x2": 431.90985, "r_y2": 668.2607, "r_x3": 320.81696, "r_y3": 668.2607, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.49896, "r_y0": 677.2868100000001, "r_x1": 545.11255, "r_y1": 677.2868100000001, "r_x2": 545.11255, "r_y2": 668.3802499999999, "r_x3": 439.49896, "r_y3": 668.3802499999999, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 689.24181, "r_x1": 545.11499, "r_y1": 689.24181, "r_x2": 545.11499, "r_y2": 680.33525, "r_x3": 308.86197, "r_y3": 680.33525, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 701.196815, "r_x1": 545.11511, "r_y1": 701.196815, "r_x2": 545.11511, "r_y2": 692.290253, "r_x3": 308.86197, "r_y3": 692.290253, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 713.1518169999999, "r_x1": 545.11505, "r_y1": 713.1518169999999, "r_x2": 545.11505, "r_y2": 704.245255, "r_x3": 308.86197, "r_y3": 704.245255, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-" } ], "headers": [ { "label": "page_footer", "id": 14, "page_no": 3, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.12097, "t": 734.133251, "r": 300.10226, "b": 743.039814, "coord_origin": "TOPLEFT" }, "confidence": 0.8565718531608582, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12097, "r_y0": 743.039814, "r_x1": 300.10226, "r_y1": 743.039814, "r_x2": 300.10226, "r_y2": 734.133251, "r_x3": 295.12097, "r_y3": 734.133251, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" } ] } }, { "page_no": 4, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 125.62891000000002, "r_x1": 84.927567, "r_y1": 125.62891000000002, "r_x2": 84.927567, "r_y2": 122.43970000000002, "r_x3": 81.688072, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 125.62891000000002, "r_x1": 93.026291, "r_y1": 125.62891000000002, "r_x2": 93.026291, "r_y2": 122.43970000000002, "r_x3": 86.54731, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.50498, "r_y0": 118.44135000000006, "r_x1": 115.3461, "r_y1": 118.44135000000006, "r_x2": 115.3461, "r_y2": 115.25214000000005, "r_x3": 102.50498, "r_y3": 115.25214000000005, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.140205, "r_y0": 118.40410999999995, "r_x1": 93.291527, "r_y1": 118.40410999999995, "r_x2": 93.291527, "r_y2": 115.21489999999994, "r_x3": 82.140205, "r_y3": 115.21489999999994, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 125.62891000000002, "r_x1": 104.3119, "r_y1": 125.62891000000002, "r_x2": 104.3119, "r_y2": 122.43970000000002, "r_x3": 96.748268, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 130.93291999999997, "r_x1": 102.42083, "r_y1": 130.93291999999997, "r_x2": 102.42083, "r_y2": 127.74370999999985, "r_x3": 96.748268, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 136.6449, "r_x1": 104.3119, "r_y1": 136.6449, "r_x2": 104.3119, "r_y2": 133.45569, "r_x3": 96.748268, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 142.35693000000003, "r_x1": 102.42083, "r_y1": 142.35693000000003, "r_x2": 102.42083, "r_y2": 139.16772000000003, "r_x3": 96.748268, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 125.62891000000002, "r_x1": 116.14391, "r_y1": 125.62891000000002, "r_x2": 116.14391, "r_y2": 122.43970000000002, "r_x3": 110.66107, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 130.93291999999997, "r_x1": 116.14391, "r_y1": 130.93291999999997, "r_x2": 116.14391, "r_y2": 127.74370999999985, "r_x3": 110.66107, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 136.6449, "r_x1": 116.14391, "r_y1": 136.6449, "r_x2": 116.14391, "r_y2": 133.45569, "r_x3": 110.66107, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 142.35693000000003, "r_x1": 116.14391, "r_y1": 142.35693000000003, "r_x2": 116.14391, "r_y2": 139.16772000000003, "r_x3": 110.66107, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 130.93291999999997, "r_x1": 84.927567, "r_y1": 130.93291999999997, "r_x2": 84.927567, "r_y2": 127.74370999999985, "r_x3": 81.688072, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 130.93291999999997, "r_x1": 93.026291, "r_y1": 130.93291999999997, "r_x2": 93.026291, "r_y2": 127.74370999999985, "r_x3": 86.54731, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 136.6449, "r_x1": 84.927567, "r_y1": 136.6449, "r_x2": 84.927567, "r_y2": 133.45569, "r_x3": 81.688072, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 136.6449, "r_x1": 93.026291, "r_y1": 136.6449, "r_x2": 93.026291, "r_y2": 133.45569, "r_x3": 86.54731, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 142.35693000000003, "r_x1": 84.927567, "r_y1": 142.35693000000003, "r_x2": 84.927567, "r_y2": 139.16772000000003, "r_x3": 81.688072, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 142.35693000000003, "r_x1": 93.026291, "r_y1": 142.35693000000003, "r_x2": 93.026291, "r_y2": 139.16772000000003, "r_x3": 86.54731, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.084389, "r_y0": 96.23798, "r_x1": 113.93649, "r_y1": 96.23798, "r_x2": 113.93649, "r_y2": 90.49738000000002, "r_x3": 88.084389, "r_y3": 90.49738000000002, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81002, "r_y0": 103.37798999999995, "r_x1": 119.21240000000002, "r_y1": 103.37798999999995, "r_x2": 119.21240000000002, "r_y2": 97.63738999999998, "r_x3": 82.81002, "r_y3": 97.63738999999998, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94247, "r_y0": 106.34295999999995, "r_x1": 180.01131, "r_y1": 106.34295999999995, "r_x2": 180.01131, "r_y2": 100.60235999999998, "r_x3": 143.94247, "r_y3": 100.60235999999998, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94064, "r_y0": 113.48297000000014, "r_x1": 172.0118, "r_y1": 113.48297000000014, "r_x2": 172.0118, "r_y2": 107.74237000000005, "r_x3": 151.94064, "r_y3": 107.74237000000005, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.76939000000002, "r_y0": 86.67156999999997, "r_x1": 266.39557, "r_y1": 86.67156999999997, "r_x2": 266.39557, "r_y2": 80.93096999999989, "r_x3": 251.76939000000002, "r_y3": 80.93096999999989, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 91.77161000000001, "r_x1": 270.65021, "r_y1": 91.77161000000001, "r_x2": 270.65021, "r_y2": 86.03101000000004, "r_x3": 247.51601, "r_y3": 86.03101000000004, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.03699, "r_y0": 84.30042000000003, "r_x1": 352.12589, "r_y1": 84.30042000000003, "r_x2": 352.12589, "r_y2": 78.55980999999997, "r_x3": 331.03699, "r_y3": 78.55980999999997, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56421, "r_y0": 101.77282999999989, "r_x1": 431.7261, "r_y1": 101.77282999999989, "r_x2": 431.7261, "r_y2": 96.03223000000003, "r_x3": 390.56421, "r_y3": 96.03223000000003, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82422, "r_y0": 107.89287999999999, "r_x1": 435.46966999999995, "r_y1": 107.89287999999999, "r_x2": 435.46966999999995, "r_y2": 102.15228000000013, "r_x3": 386.82422, "r_y3": 102.15228000000013, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.69589, "r_y0": 114.01288000000011, "r_x1": 433.6032400000001, "r_y1": 114.01288000000011, "r_x2": 433.6032400000001, "r_y2": 108.27228000000002, "r_x3": 388.69589, "r_y3": 108.27228000000002, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.07761, "r_y0": 120.13286999999991, "r_x1": 431.22542999999996, "r_y1": 120.13286999999991, "r_x2": 431.22542999999996, "r_y2": 114.39227000000005, "r_x3": 391.07761, "r_y3": 114.39227000000005, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.22650000000004, "r_y0": 157.42571999999996, "r_x1": 498.82068, "r_y1": 157.42571999999996, "r_x2": 498.82068, "r_y2": 151.68511999999998, "r_x3": 431.22650000000004, "r_y3": 151.68511999999998, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.1738, "r_y0": 163.54578000000004, "r_x1": 498.87753000000004, "r_y1": 163.54578000000004, "r_x2": 498.87753000000004, "r_y2": 157.80517999999995, "r_x3": 431.1738, "r_y3": 157.80517999999995, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.5289, "r_y0": 169.66576999999995, "r_x1": 489.51827999999995, "r_y1": 169.66576999999995, "r_x2": 489.51827999999995, "r_y2": 163.92516999999998, "r_x3": 440.5289, "r_y3": 163.92516999999998, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37479, "r_y0": 183.99445000000003, "r_x1": 367.72333, "r_y1": 183.99445000000003, "r_x2": 367.72333, "r_y2": 178.25385000000006, "r_x3": 328.37479, "r_y3": 178.25385000000006, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 129.64948000000015, "r_x1": 373.67963, "r_y1": 129.64948000000015, "r_x2": 373.67963, "r_y2": 123.90886999999998, "r_x3": 331.84451, "r_y3": 123.90886999999998, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 134.74945000000002, "r_x1": 381.17786, "r_y1": 134.74945000000002, "r_x2": 381.17786, "r_y2": 129.00885000000017, "r_x3": 331.84451, "r_y3": 129.00885000000017, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.62633, "r_y0": 93.85681, "r_x1": 219.42332, "r_y1": 93.85681, "r_x2": 219.42332, "r_y2": 88.11621000000002, "r_x3": 196.62633, "r_y3": 88.11621000000002, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.66771, "r_y0": 135.23528999999996, "r_x1": 271.49899, "r_y1": 135.23528999999996, "r_x2": 271.49899, "r_y2": 129.4946900000001, "r_x3": 246.66771, "r_y3": 129.4946900000001, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 140.33533, "r_x1": 270.65021, "r_y1": 140.33533, "r_x2": 270.65021, "r_y2": 134.59473000000003, "r_x3": 247.51601, "r_y3": 134.59473000000003, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 94.75982999999997, "r_x1": 365.55347, "r_y1": 94.75982999999997, "r_x2": 365.55347, "r_y2": 89.01923, "r_x3": 330.63071, "r_y3": 89.01923, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 102.91985999999997, "r_x1": 370.22717, "r_y1": 102.91985999999997, "r_x2": 370.22717, "r_y2": 97.17926, "r_x3": 330.63071, "r_y3": 97.17926, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 111.07983000000002, "r_x1": 374.51157, "r_y1": 111.07983000000002, "r_x2": 374.51157, "r_y2": 105.33922999999993, "r_x3": 330.63071, "r_y3": 105.33922999999993, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 119.23987, "r_x1": 335.73233, "r_y1": 119.23987, "r_x2": 335.73233, "r_y2": 113.49926999999991, "r_x3": 330.63071, "r_y3": 113.49926999999991, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 146.57617000000005, "r_x1": 335.05988, "r_y1": 146.57617000000005, "r_x2": 335.05988, "r_y2": 141.79236000000003, "r_x3": 322.30579, "r_y3": 141.79236000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 153.71613000000002, "r_x1": 335.05988, "r_y1": 153.71613000000002, "r_x2": 335.05988, "r_y2": 148.93231000000003, "r_x3": 322.30579, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.54971, "r_y0": 154.29638999999997, "r_x1": 340.95242, "r_y1": 154.29638999999997, "r_x2": 340.95242, "r_y2": 148.55579, "r_x3": 337.54971, "r_y3": 148.55579, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56262, "r_y0": 153.71613000000002, "r_x1": 398.91446, "r_y1": 153.71613000000002, "r_x2": 398.91446, "r_y2": 148.93231000000003, "r_x3": 343.56262, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.41718, "r_y0": 153.71613000000002, "r_x1": 421.58801, "r_y1": 153.71613000000002, "r_x2": 421.58801, "r_y2": 148.93231000000003, "r_x3": 407.41718, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 160.85613999999998, "r_x1": 349.23022, "r_y1": 160.85613999999998, "r_x2": 349.23022, "r_y2": 156.07232999999997, "r_x3": 322.30579, "r_y3": 156.07232999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 167.99614999999994, "r_x1": 335.05988, "r_y1": 167.99614999999994, "r_x2": 335.05988, "r_y2": 163.21234000000004, "r_x3": 322.30579, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56155, "r_y0": 167.99614999999994, "r_x1": 374.73685, "r_y1": 167.99614999999994, "r_x2": 374.73685, "r_y2": 163.21234000000004, "r_x3": 343.56155, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 175.13617, "r_x1": 326.55716, "r_y1": 175.13617, "r_x2": 326.55716, "r_y2": 170.35235999999998, "r_x3": 322.30579, "r_y3": 170.35235999999998, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51111, "r_y0": 95.41027999999994, "r_x1": 326.91382, "r_y1": 95.41027999999994, "r_x2": 326.91382, "r_y2": 89.66967999999997, "r_x3": 323.51111, "r_y3": 89.66967999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 103.52948000000004, "r_x1": 327.1178, "r_y1": 103.52948000000004, "r_x2": 327.1178, "r_y2": 97.78887999999995, "r_x3": 323.71509, "r_y3": 97.78887999999995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 111.73029000000008, "r_x1": 327.1178, "r_y1": 111.73029000000008, "r_x2": 327.1178, "r_y2": 105.98969, "r_x3": 323.71509, "r_y3": 105.98969, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.4816, "r_y0": 154.28687000000002, "r_x1": 404.88431, "r_y1": 154.28687000000002, "r_x2": 404.88431, "r_y2": 148.54625999999996, "r_x3": 401.4816, "r_y3": 148.54625999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.6976, "r_y0": 168.42511000000002, "r_x1": 341.10031, "r_y1": 168.42511000000002, "r_x2": 341.10031, "r_y2": 162.68451000000005, "r_x3": 337.6976, "r_y3": 162.68451000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46378, "r_y0": 110.28644000000008, "r_x1": 457.86648999999994, "r_y1": 110.28644000000008, "r_x2": 457.86648999999994, "r_y2": 104.54584, "r_x3": 454.46378, "r_y3": 104.54584, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.32580999999993, "r_y0": 96.83605999999997, "r_x1": 496.72852, "r_y1": 96.83605999999997, "r_x2": 496.72852, "r_y2": 91.09546, "r_x3": 493.32580999999993, "r_y3": 91.09546, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08298, "r_y0": 96.30939000000001, "r_x1": 457.48569000000003, "r_y1": 96.30939000000001, "r_x2": 457.48569000000003, "r_y2": 90.56879000000015, "r_x3": 454.08298, "r_y3": 90.56879000000015, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 213.01189999999997, "r_x1": 86.883949, "r_y1": 213.01189999999997, "r_x2": 86.883949, "r_y2": 204.10535000000004, "r_x3": 50.112, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.020996, "r_y0": 212.94214, "r_x1": 149.85141, "r_y1": 212.94214, "r_x2": 149.85141, "r_y2": 203.98577999999998, "r_x3": 94.020996, "r_y3": 203.98577999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86099, "r_y0": 213.01189999999997, "r_x1": 545.10846, "r_y1": 213.01189999999997, "r_x2": 545.10846, "r_y2": 204.10535000000004, "r_x3": 152.86099, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 224.96691999999996, "r_x1": 436.0134, "r_y1": 224.96691999999996, "r_x2": 436.0134, "r_y2": 216.06035999999995, "r_x3": 50.111992, "r_y3": 216.06035999999995, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.253464, "r_y0": 264.17474000000004, "r_x1": 101.75846, "r_y1": 264.17474000000004, "r_x2": 101.75846, "r_y2": 258.21472000000006, "r_x3": 74.253464, "r_y3": 258.21472000000006, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.29972, "r_y0": 264.30524, "r_x1": 157.83972, "r_y1": 264.30524, "r_x2": 157.83972, "r_y2": 258.34520999999995, "r_x3": 122.29972, "r_y3": 258.34520999999995, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.549347, "r_y0": 377.04782, "r_x1": 125.68359000000001, "r_y1": 377.04782, "r_x2": 125.68359000000001, "r_y2": 371.38579999999996, "r_x3": 78.549347, "r_y3": 371.38579999999996, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.513298, "r_y0": 396.98059, "r_x1": 84.644547, "r_y1": 396.98059, "r_x2": 84.644547, "r_y2": 391.31857, "r_x3": 78.513298, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.52705, "r_y0": 396.98059, "r_x1": 125.11079999999998, "r_y1": 396.98059, "r_x2": 125.11079999999998, "r_y2": 391.31857, "r_x3": 116.52705, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.024773, "r_y0": 430.11511, "r_x1": 127.92327000000002, "r_y1": 430.11511, "r_x2": 127.92327000000002, "r_y2": 424.45309, "r_x3": 76.024773, "r_y3": 424.45309, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.382828, "r_y0": 450.55157, "r_x1": 84.514076, "r_y1": 450.55157, "r_x2": 84.514076, "r_y2": 444.88956, "r_x3": 78.382828, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.39658, "r_y0": 450.55157, "r_x1": 124.98033, "r_y1": 450.55157, "r_x2": 124.98033, "r_y2": 444.88956, "r_x3": 116.39658, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.46945, "r_y0": 468.10526, "r_x1": 181.6292, "r_y1": 468.10526, "r_x2": 181.6292, "r_y2": 462.44324, "r_x3": 167.46945, "r_y3": 462.44324, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61292, "r_y0": 484.13309, "r_x1": 184.43242, "r_y1": 484.13309, "r_x2": 184.43242, "r_y2": 478.47107, "r_x3": 165.61292, "r_y3": 478.47107, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.319511, "r_y0": 330.22235000000006, "r_x1": 132.9245, "r_y1": 330.22235000000006, "r_x2": 132.9245, "r_y2": 324.26235999999994, "r_x3": 65.319511, "r_y3": 324.26235999999994, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51457, "r_y0": 274.72992, "r_x1": 162.98782, "r_y1": 274.72992, "r_x2": 162.98782, "r_y2": 269.66394, "r_x3": 119.51457, "r_y3": 269.66394, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.72858, "r_y0": 279.97992, "r_x1": 151.41083, "r_y1": 279.97992, "r_x2": 151.41083, "r_y2": 274.91394, "r_x3": 128.72858, "r_y3": 274.91394, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.434211999999995, "r_y0": 344.26993, "r_x1": 80.27021, "r_y1": 344.26993, "r_x2": 80.27021, "r_y2": 338.95993, "r_x3": 60.434211999999995, "r_y3": 338.95993, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.598457, "r_y0": 348.69604, "r_x1": 78.854958, "r_y1": 348.69604, "r_x2": 78.854958, "r_y2": 343.38605, "r_x3": 60.598457, "r_y3": 343.38605, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.82877, "r_y0": 298.68762, "r_x1": 154.66476, "r_y1": 298.68762, "r_x2": 154.66476, "r_y2": 293.37762, "r_x3": 134.82877, "r_y3": 293.37762, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99303, "r_y0": 303.11371, "r_x1": 153.24953, "r_y1": 303.11371, "r_x2": 153.24953, "r_y2": 297.80370999999997, "r_x3": 134.99303, "r_y3": 297.80370999999997, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 351.02063, "r_x1": 197.14943, "r_y1": 351.02063, "r_x2": 197.14943, "r_y2": 345.35861, "r_x3": 150.55193, "r_y3": 345.35861, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 400.08542, "r_x1": 156.68318, "r_y1": 400.08542, "r_x2": 156.68318, "r_y2": 394.4234, "r_x3": 150.55193, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 400.08542, "r_x1": 197.14943, "r_y1": 400.08542, "r_x2": 197.14943, "r_y2": 394.4234, "r_x3": 188.56567, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.18539, "r_y0": 381.33044, "r_x1": 197.31964, "r_y1": 381.33044, "r_x2": 197.31964, "r_y2": 375.66843, "r_x3": 150.18539, "r_y3": 375.66843, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 445.91049, "r_x1": 156.68318, "r_y1": 445.91049, "r_x2": 156.68318, "r_y2": 440.24847000000005, "r_x3": 150.55193, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 445.91049, "r_x1": 197.14943, "r_y1": 445.91049, "r_x2": 197.14943, "r_y2": 440.24847000000005, "r_x3": 188.56567, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86377, "r_y0": 427.75537, "r_x1": 199.76227, "r_y1": 427.75537, "r_x2": 199.76227, "r_y2": 422.09335, "r_x3": 147.86377, "r_y3": 422.09335, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.56567000000004, "r_y0": 319.92487, "r_x1": 255.72542, "r_y1": 319.92487, "r_x2": 255.72542, "r_y2": 314.26285000000007, "r_x3": 241.56567000000004, "r_y3": 314.26285000000007, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.91730000000004, "r_y0": 367.02695, "r_x1": 256.07706, "r_y1": 367.02695, "r_x2": 256.07706, "r_y2": 361.36493, "r_x3": 241.91730000000004, "r_y3": 361.36493, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.054, "r_y0": 342.28131, "r_x1": 248.72363000000004, "r_y1": 342.28131, "r_x2": 248.72363000000004, "r_y2": 336.61929000000003, "r_x3": 228.054, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.2919, "r_y0": 342.28131, "r_x1": 269.39325, "r_y1": 342.28131, "r_x2": 269.39325, "r_y2": 336.61929000000003, "r_x3": 246.2919, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.44568000000004, "r_y0": 410.80884, "r_x1": 238.73892, "r_y1": 410.80884, "r_x2": 238.73892, "r_y2": 405.14682, "r_x3": 228.44568000000004, "r_y3": 405.14682, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.29767, "r_y0": 410.86526, "r_x1": 271.77792, "r_y1": 410.86526, "r_x2": 271.77792, "r_y2": 405.2032500000001, "r_x3": 256.29767, "r_y3": 405.2032500000001, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.54543, "r_y0": 387.87546, "r_x1": 258.08942, "r_y1": 387.87546, "r_x2": 258.08942, "r_y2": 382.21344, "r_x3": 239.54543, "r_y3": 382.21344, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.14704100000001, "r_y0": 449.78326, "r_x1": 59.51152, "r_y1": 449.78326, "r_x2": 59.51152, "r_y2": 384.87183, "r_x3": 54.14704100000001, "r_y3": 384.87183, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.235424, "r_y0": 378.45421999999996, "r_x1": 59.30449699999999, "r_y1": 378.45421999999996, "r_x2": 59.30449699999999, "r_y2": 373.81232, "r_x3": 54.235424, "r_y3": 373.81232, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.295891, "r_y0": 490.36688, "r_x1": 122.16431, "r_y1": 490.36688, "r_x2": 122.16431, "r_y2": 484.53189, "r_x3": 85.295891, "r_y3": 484.53189, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.66599, "r_y0": 285.45572000000004, "r_x1": 265.3194, "r_y1": 285.45572000000004, "r_x2": 265.3194, "r_y2": 279.54607999999996, "r_x3": 229.66599, "r_y3": 279.54607999999996, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17369, "r_y0": 506.12943, "r_x1": 190.41711, "r_y1": 506.12943, "r_x2": 190.41711, "r_y2": 500.3031, "r_x3": 157.17369, "r_y3": 500.3031, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.81598999999997, "r_y0": 443.89206, "r_x1": 270.78442, "r_y1": 443.89206, "r_x2": 270.78442, "r_y2": 438.05542, "r_x3": 227.81598999999997, "r_y3": 438.05542, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.70262, "r_y0": 449.8904999999999, "r_x1": 263.51105, "r_y1": 449.8904999999999, "r_x2": 263.51105, "r_y2": 444.06183, "r_x3": 233.70262, "r_y3": 444.06183, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.74655, "r_y0": 298.75903, "r_x1": 212.16055, "r_y1": 298.75903, "r_x2": 212.16055, "r_y2": 293.39502, "r_x3": 184.74655, "r_y3": 293.39502, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91229, "r_y0": 304.50903, "r_x1": 216.74378999999996, "r_y1": 304.50903, "r_x2": 216.74378999999996, "r_y2": 299.14502, "r_x3": 178.91229, "r_y3": 299.14502, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.24574, "r_y0": 287.84817999999996, "r_x1": 198.89099, "r_y1": 287.84817999999996, "r_x2": 198.89099, "r_y2": 282.7822, "r_x3": 194.24574, "r_y3": 282.7822, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.45587, "r_y0": 277.82916, "r_x1": 276.47089, "r_y1": 277.82916, "r_x2": 276.47089, "r_y2": 271.86914, "r_x3": 221.45587, "r_y3": 271.86914, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65219, "r_y0": 329.10443, "r_x1": 197.29019, "r_y1": 329.10443, "r_x2": 197.29019, "r_y2": 323.44241, "r_x3": 151.65219, "r_y3": 323.44241, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43277, "r_y0": 335.10443, "r_x1": 184.19028, "r_y1": 335.10443, "r_x2": 184.19028, "r_y2": 329.44241, "r_x3": 163.43277, "r_y3": 329.44241, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 536.80893, "r_x1": 229.78752, "r_y1": 536.80893, "r_x2": 229.78752, "r_y2": 527.90237, "r_x3": 50.112, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.787, "r_y0": 536.7392, "r_x1": 267.76196, "r_y1": 536.7392, "r_x2": 267.76196, "r_y2": 527.7828099999999, "r_x3": 231.787, "r_y3": 527.7828099999999, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76401, "r_y0": 536.80893, "r_x1": 286.36169, "r_y1": 536.80893, "r_x2": 286.36169, "r_y2": 527.90237, "r_x3": 269.76401, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 548.76393, "r_x1": 286.36508, "r_y1": 548.76393, "r_x2": 286.36508, "r_y2": 539.85738, "r_x3": 50.112015, "r_y3": 539.85738, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 560.71992, "r_x1": 205.84735, "r_y1": 560.71992, "r_x2": 205.84735, "r_y2": 551.81337, "r_x3": 50.112015, "r_y3": 551.81337, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.01802, "r_y0": 560.6501900000001, "r_x1": 286.36392, "r_y1": 560.6501900000001, "r_x2": 286.36392, "r_y2": 551.69382, "r_x3": 208.01802, "r_y3": 551.69382, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 572.67493, "r_x1": 64.498009, "r_y1": 572.67493, "r_x2": 64.498009, "r_y2": 563.76837, "r_x3": 50.112015, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.165016, "r_y0": 572.60519, "r_x1": 151.31288, "r_y1": 572.60519, "r_x2": 151.31288, "r_y2": 563.64882, "r_x3": 68.165016, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31302, "r_y0": 572.67493, "r_x1": 153.80367, "r_y1": 572.67493, "r_x2": 153.80367, "r_y2": 563.76837, "r_x3": 151.31302, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.41884, "r_y0": 572.67493, "r_x1": 241.93283000000002, "r_y1": 572.67493, "r_x2": 241.93283000000002, "r_y2": 563.76837, "r_x3": 160.41884, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.59502, "r_y0": 572.60519, "r_x1": 286.362, "r_y1": 572.60519, "r_x2": 286.362, "r_y2": 563.64882, "r_x3": 245.59502, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 584.5602, "r_x1": 85.519089, "r_y1": 584.5602, "r_x2": 85.519089, "r_y2": 575.60382, "r_x3": 50.112015, "r_y3": 575.60382, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.623016, "r_y0": 584.6299300000001, "r_x1": 286.36072, "r_y1": 584.6299300000001, "r_x2": 286.36072, "r_y2": 575.7233699999999, "r_x3": 88.623016, "r_y3": 575.7233699999999, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 596.58493, "r_x1": 286.36511, "r_y1": 596.58493, "r_x2": 286.36511, "r_y2": 587.6783800000001, "r_x3": 50.112015, "r_y3": 587.6783800000001, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 608.53993, "r_x1": 286.36508, "r_y1": 608.53993, "r_x2": 286.36508, "r_y2": 599.63338, "r_x3": 50.112015, "r_y3": 599.63338, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 620.4949300000001, "r_x1": 240.43756000000002, "r_y1": 620.4949300000001, "r_x2": 240.43756000000002, "r_y2": 611.58838, "r_x3": 50.112015, "r_y3": 611.58838, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.19801, "r_y0": 620.4252, "r_x1": 286.36597, "r_y1": 620.4252, "r_x2": 286.36597, "r_y2": 611.46883, "r_x3": 243.19801, "r_y3": 611.46883, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 632.3812, "r_x1": 286.36511, "r_y1": 632.3812, "r_x2": 286.36511, "r_y2": 623.42482, "r_x3": 50.112015, "r_y3": 623.42482, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 644.3362, "r_x1": 286.36508, "r_y1": 644.3362, "r_x2": 286.36508, "r_y2": 635.37982, "r_x3": 50.112015, "r_y3": 635.37982, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 656.36093, "r_x1": 220.58205, "r_y1": 656.36093, "r_x2": 220.58205, "r_y2": 647.45438, "r_x3": 50.112015, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.57802000000004, "r_y0": 656.14175, "r_x1": 228.32693, "r_y1": 656.14175, "r_x2": 228.32693, "r_y2": 647.29497, "r_x3": 220.57802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.32700999999997, "r_y0": 656.36093, "r_x1": 236.07791000000003, "r_y1": 656.36093, "r_x2": 236.07791000000003, "r_y2": 647.45438, "r_x3": 228.32700999999997, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.07802000000004, "r_y0": 656.14175, "r_x1": 243.82693, "r_y1": 656.14175, "r_x2": 243.82693, "r_y2": 647.29497, "r_x3": 236.07802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.82602, "r_y0": 656.36093, "r_x1": 255.29298000000003, "r_y1": 656.36093, "r_x2": 255.29298000000003, "r_y2": 647.45438, "r_x3": 243.82602, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29102000000003, "r_y0": 656.14175, "r_x1": 263.03992, "r_y1": 656.14175, "r_x2": 263.03992, "r_y2": 647.29497, "r_x3": 255.29102000000003, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04001, "r_y0": 656.36093, "r_x1": 286.36246, "r_y1": 656.36093, "r_x2": 286.36246, "r_y2": 647.45438, "r_x3": 263.04001, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 668.31594, "r_x1": 286.36511, "r_y1": 668.31594, "r_x2": 286.36511, "r_y2": 659.40938, "r_x3": 50.112015, "r_y3": 659.40938, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 680.27094, "r_x1": 218.46996, "r_y1": 680.27094, "r_x2": 218.46996, "r_y2": 671.36438, "r_x3": 50.112015, "r_y3": 671.36438, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.44097999999997, "r_x1": 523.05786, "r_y1": 258.44097999999997, "r_x2": 523.05786, "r_y2": 249.53441999999995, "r_x3": 308.862, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.19983, "r_y0": 258.44097999999997, "r_x1": 545.11505, "r_y1": 258.44097999999997, "r_x2": 545.11505, "r_y2": 249.53441999999995, "r_x3": 525.19983, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.39697, "r_x1": 517.55847, "r_y1": 270.39697, "r_x2": 517.55847, "r_y2": 261.49042, "r_x3": 308.862, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 270.39697, "r_x1": 545.11499, "r_y1": 270.39697, "r_x2": 545.11499, "r_y2": 261.49042, "r_x3": 520.76642, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.35196, "r_x1": 534.80377, "r_y1": 282.35196, "r_x2": 534.80377, "r_y2": 273.44537, "r_x3": 308.862, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36414, "r_y0": 282.35196, "r_x1": 545.11505, "r_y1": 282.35196, "r_x2": 545.11505, "r_y2": 273.44537, "r_x3": 537.36414, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.3069499999999, "r_x1": 341.24045, "r_y1": 294.3069499999999, "r_x2": 341.24045, "r_y2": 285.40039, "r_x3": 308.862, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73099, "r_y0": 294.07782000000003, "r_x1": 417.23508, "r_y1": 294.07782000000003, "r_x2": 417.23508, "r_y2": 285.49005, "r_x3": 343.73099, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23398, "r_y0": 294.3069499999999, "r_x1": 436.60129, "r_y1": 294.3069499999999, "r_x2": 436.60129, "r_y2": 285.40039, "r_x3": 417.23398, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09198, "r_y0": 294.07782000000003, "r_x1": 516.56116, "r_y1": 294.07782000000003, "r_x2": 516.56116, "r_y2": 285.49005, "r_x3": 439.09198, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56097, "r_y0": 294.3069499999999, "r_x1": 519.05164, "r_y1": 294.3069499999999, "r_x2": 519.05164, "r_y2": 285.40039, "r_x3": 516.56097, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 306.2962, "r_x1": 400.86649, "r_y1": 306.2962, "r_x2": 400.86649, "r_y2": 297.33981, "r_x3": 320.81696, "r_y3": 297.33981, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91394, "r_y0": 306.36594, "r_x1": 528.33685, "r_y1": 306.36594, "r_x2": 528.33685, "r_y2": 297.45938, "r_x3": 403.91394, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.7179, "r_y0": 306.36594, "r_x1": 545.11383, "r_y1": 306.36594, "r_x2": 545.11383, "r_y2": 297.45938, "r_x3": 530.7179, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 318.32092, "r_x1": 517.5285, "r_y1": 318.32092, "r_x2": 517.5285, "r_y2": 309.41437, "r_x3": 308.86194, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09387, "r_y0": 318.32092, "r_x1": 545.11493, "r_y1": 318.32092, "r_x2": 545.11493, "r_y2": 309.41437, "r_x3": 524.09387, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 330.27591, "r_x1": 432.35833999999994, "r_y1": 330.27591, "r_x2": 432.35833999999994, "r_y2": 321.36934999999994, "r_x3": 308.86194, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.81995000000006, "r_y0": 330.04678, "r_x1": 510.29041, "r_y1": 330.04678, "r_x2": 510.29041, "r_y2": 321.45901, "r_x3": 435.81995000000006, "r_y3": 321.45901, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.97797, "r_y0": 330.27591, "r_x1": 520.62305, "r_y1": 330.27591, "r_x2": 520.62305, "r_y2": 321.36934999999994, "r_x3": 513.97797, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08008, "r_y0": 330.27591, "r_x1": 545.11115, "r_y1": 330.27591, "r_x2": 545.11115, "r_y2": 321.36934999999994, "r_x3": 524.08008, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 342.2309, "r_x1": 527.76013, "r_y1": 342.2309, "r_x2": 527.76013, "r_y2": 333.32434, "r_x3": 308.86197, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.729, "r_y0": 342.2309, "r_x1": 545.11499, "r_y1": 342.2309, "r_x2": 545.11499, "r_y2": 333.32434, "r_x3": 530.729, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 354.18588, "r_x1": 526.85352, "r_y1": 354.18588, "r_x2": 526.85352, "r_y2": 345.27933, "r_x3": 308.86197, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62311, "r_y0": 354.18588, "r_x1": 545.11493, "r_y1": 354.18588, "r_x2": 545.11493, "r_y2": 345.27933, "r_x3": 529.62311, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 366.14188, "r_x1": 524.51245, "r_y1": 366.14188, "r_x2": 524.51245, "r_y2": 357.23532, "r_x3": 308.86197, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.96948, "r_y0": 366.14188, "r_x1": 545.11511, "r_y1": 366.14188, "r_x2": 545.11511, "r_y2": 357.23532, "r_x3": 527.96948, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 378.09685999999994, "r_x1": 370.39096, "r_y1": 378.09685999999994, "r_x2": 370.39096, "r_y2": 369.19031000000007, "r_x3": 308.86197, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44449, "r_y0": 378.09685999999994, "r_x1": 526.91339, "r_y1": 378.09685999999994, "r_x2": 526.91339, "r_y2": 369.19031000000007, "r_x3": 377.44449, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72906, "r_y0": 378.09685999999994, "r_x1": 545.11505, "r_y1": 378.09685999999994, "r_x2": 545.11505, "r_y2": 369.19031000000007, "r_x3": 530.72906, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 390.05185, "r_x1": 505.46395999999993, "r_y1": 390.05185, "r_x2": 505.46395999999993, "r_y2": 381.14529000000005, "r_x3": 308.86197, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03430000000003, "r_y0": 390.05185, "r_x1": 545.11511, "r_y1": 390.05185, "r_x2": 545.11511, "r_y2": 381.14529000000005, "r_x3": 508.03430000000003, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 402.00684, "r_x1": 517.68799, "r_y1": 402.00684, "r_x2": 517.68799, "r_y2": 393.10028, "r_x3": 308.86197, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 402.00684, "r_x1": 545.11499, "r_y1": 402.00684, "r_x2": 545.11499, "r_y2": 393.10028, "r_x3": 520.76642, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 413.96182, "r_x1": 528.01935, "r_y1": 413.96182, "r_x2": 528.01935, "r_y2": 405.05526999999995, "r_x3": 308.86197, "r_y3": 405.05526999999995, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 426.02081, "r_x1": 515.49609, "r_y1": 426.02081, "r_x2": 515.49609, "r_y2": 417.11426, "r_x3": 320.81696, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.7663, "r_y0": 426.02081, "r_x1": 545.11487, "r_y1": 426.02081, "r_x2": 545.11487, "r_y2": 417.11426, "r_x3": 520.7663, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 437.9758, "r_x1": 343.72107, "r_y1": 437.9758, "r_x2": 343.72107, "r_y2": 429.0692399999999, "r_x3": 308.86197, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.03796, "r_y0": 437.74667, "r_x1": 446.45471000000003, "r_y1": 437.74667, "r_x2": 446.45471000000003, "r_y2": 429.15891, "r_x3": 347.03796, "r_y3": 429.15891, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.93996999999996, "r_y0": 437.9758, "r_x1": 503.06055000000003, "r_y1": 437.9758, "r_x2": 503.06055000000003, "r_y2": 429.0692399999999, "r_x3": 449.93996999999996, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.37808, "r_y0": 437.9758, "r_x1": 537.3717, "r_y1": 437.9758, "r_x2": 537.3717, "r_y2": 429.0692399999999, "r_x3": 506.37808, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.68927, "r_y0": 437.9758, "r_x1": 545.11267, "r_y1": 437.9758, "r_x2": 545.11267, "r_y2": 429.0692399999999, "r_x3": 540.68927, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 449.93079, "r_x1": 522.78894, "r_y1": 449.93079, "r_x2": 522.78894, "r_y2": 441.02423, "r_x3": 308.86197, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.7478, "r_y0": 449.93079, "r_x1": 545.11511, "r_y1": 449.93079, "r_x2": 545.11511, "r_y2": 441.02423, "r_x3": 525.7478, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 461.88577, "r_x1": 384.14929, "r_y1": 461.88577, "r_x2": 384.14929, "r_y2": 452.97922, "r_x3": 308.86197, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37466, "r_y0": 461.88577, "r_x1": 527.84985, "r_y1": 461.88577, "r_x2": 527.84985, "r_y2": 452.97922, "r_x3": 393.37466, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39282, "r_y0": 461.88577, "r_x1": 545.11505, "r_y1": 461.88577, "r_x2": 545.11505, "r_y2": 452.97922, "r_x3": 532.39282, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 473.84177, "r_x1": 529.7627, "r_y1": 473.84177, "r_x2": 529.7627, "r_y2": 464.93521, "r_x3": 308.86197, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94073, "r_y0": 473.84177, "r_x1": 545.11505, "r_y1": 473.84177, "r_x2": 545.11505, "r_y2": 464.93521, "r_x3": 532.94073, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 485.79675, "r_x1": 514.17126, "r_y1": 485.79675, "r_x2": 514.17126, "r_y2": 476.8902, "r_x3": 308.86197, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89105, "r_y0": 485.79675, "r_x1": 545.11511, "r_y1": 485.79675, "r_x2": 545.11511, "r_y2": 476.8902, "r_x3": 516.89105, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.75174, "r_x1": 527.63068, "r_y1": 497.75174, "r_x2": 527.63068, "r_y2": 488.84518, "r_x3": 308.86197, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62317, "r_y0": 497.75174, "r_x1": 545.11499, "r_y1": 497.75174, "r_x2": 545.11499, "r_y2": 488.84518, "r_x3": 529.62317, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.70673, "r_x1": 508.3630999999999, "r_y1": 509.70673, "r_x2": 508.3630999999999, "r_y2": 500.80017, "r_x3": 308.86197, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09286000000003, "r_y0": 509.70673, "r_x1": 545.11511, "r_y1": 509.70673, "r_x2": 545.11511, "r_y2": 500.80017, "r_x3": 511.09286000000003, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.6617100000001, "r_x1": 545.11499, "r_y1": 521.6617100000001, "r_x2": 545.11499, "r_y2": 512.7551599999999, "r_x3": 308.86197, "r_y3": 512.7551599999999, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.61771, "r_x1": 545.11511, "r_y1": 533.61771, "r_x2": 545.11511, "r_y2": 524.71115, "r_x3": 308.86197, "r_y3": 524.71115, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.57271, "r_x1": 369.73349, "r_y1": 545.57271, "r_x2": 369.73349, "r_y2": 536.66615, "r_x3": 308.86197, "r_y3": 536.66615, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 557.56097, "r_x1": 404.76184, "r_y1": 557.56097, "r_x2": 404.76184, "r_y2": 548.6046, "r_x3": 320.81696, "r_y3": 548.6046, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34094, "r_y0": 557.63071, "r_x1": 545.11505, "r_y1": 557.63071, "r_x2": 545.11505, "r_y2": 548.72415, "r_x3": 410.34094, "r_y3": 548.72415, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 569.5867000000001, "r_x1": 545.11493, "r_y1": 569.5867000000001, "r_x2": 545.11493, "r_y2": 560.68015, "r_x3": 308.86194, "r_y3": 560.68015, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 581.5417, "r_x1": 545.11511, "r_y1": 581.5417, "r_x2": 545.11511, "r_y2": 572.6351500000001, "r_x3": 308.86194, "r_y3": 572.6351500000001, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 593.4967, "r_x1": 545.11493, "r_y1": 593.4967, "r_x2": 545.11493, "r_y2": 584.59015, "r_x3": 308.86194, "r_y3": 584.59015, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 605.45171, "r_x1": 545.11499, "r_y1": 605.45171, "r_x2": 545.11499, "r_y2": 596.54515, "r_x3": 308.86194, "r_y3": 596.54515, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 617.40671, "r_x1": 545.11505, "r_y1": 617.40671, "r_x2": 545.11505, "r_y2": 608.50015, "r_x3": 308.86194, "r_y3": 608.50015, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 629.36171, "r_x1": 545.11505, "r_y1": 629.36171, "r_x2": 545.11505, "r_y2": 620.45515, "r_x3": 308.86194, "r_y3": 620.45515, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 641.3177000000001, "r_x1": 381.67859, "r_y1": 641.3177000000001, "r_x2": 381.67859, "r_y2": 632.41115, "r_x3": 308.86194, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.99695, "r_y0": 641.09853, "r_x1": 391.74585, "r_y1": 641.09853, "r_x2": 391.74585, "r_y2": 632.25174, "r_x3": 383.99695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.74594, "r_y0": 641.3177000000001, "r_x1": 399.49686, "r_y1": 641.3177000000001, "r_x2": 399.49686, "r_y2": 632.41115, "r_x3": 391.74594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.49695, "r_y0": 641.09853, "r_x1": 407.24585, "r_y1": 641.09853, "r_x2": 407.24585, "r_y2": 632.25174, "r_x3": 399.49695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.24594, "r_y0": 641.3177000000001, "r_x1": 432.90958, "r_y1": 641.3177000000001, "r_x2": 432.90958, "r_y2": 632.41115, "r_x3": 407.24594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.90792999999996, "r_y0": 641.09853, "r_x1": 440.65683000000007, "r_y1": 641.09853, "r_x2": 440.65683000000007, "r_y2": 632.25174, "r_x3": 432.90792999999996, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.65691999999996, "r_y0": 641.3177000000001, "r_x1": 545.11475, "r_y1": 641.3177000000001, "r_x2": 545.11475, "r_y2": 632.41115, "r_x3": 440.65691999999996, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 653.27271, "r_x1": 398.96371, "r_y1": 653.27271, "r_x2": 398.96371, "r_y2": 644.3661500000001, "r_x3": 308.86194, "r_y3": 644.3661500000001, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81693, "r_y0": 665.33172, "r_x1": 444.34316999999993, "r_y1": 665.33172, "r_x2": 444.34316999999993, "r_y2": 656.42516, "r_x3": 320.81693, "r_y3": 656.42516, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.00591999999995, "r_y0": 665.10258, "r_x1": 545.1076, "r_y1": 665.10258, "r_x2": 545.1076, "r_y2": 656.51482, "r_x3": 447.00591999999995, "r_y3": 656.51482, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 677.2867200000001, "r_x1": 545.11505, "r_y1": 677.2867200000001, "r_x2": 545.11505, "r_y2": 668.38016, "r_x3": 308.86194, "r_y3": 668.38016, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 689.24172, "r_x1": 545.11505, "r_y1": 689.24172, "r_x2": 545.11505, "r_y2": 680.33516, "r_x3": 308.86194, "r_y3": 680.33516, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 701.196724, "r_x1": 545.11505, "r_y1": 701.196724, "r_x2": 545.11505, "r_y2": 692.290161, "r_x3": 308.86194, "r_y3": 692.290161, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 713.151726, "r_x1": 545.11505, "r_y1": 713.151726, "r_x2": 545.11505, "r_y2": 704.245163, "r_x3": 308.86194, "r_y3": 704.245163, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12094, "r_y0": 743.039722, "r_x1": 300.10223, "r_y1": 743.039722, "r_x2": 300.10223, "r_y2": 734.13316, "r_x3": 295.12094, "r_y3": 734.13316, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "picture", "bbox": { "l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT" }, "confidence": 0.9296807646751404, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 125.62891000000002, "r_x1": 84.927567, "r_y1": 125.62891000000002, "r_x2": 84.927567, "r_y2": 122.43970000000002, "r_x3": 81.688072, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 125.62891000000002, "r_x1": 93.026291, "r_y1": 125.62891000000002, "r_x2": 93.026291, "r_y2": 122.43970000000002, "r_x3": 86.54731, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.50498, "r_y0": 118.44135000000006, "r_x1": 115.3461, "r_y1": 118.44135000000006, "r_x2": 115.3461, "r_y2": 115.25214000000005, "r_x3": 102.50498, "r_y3": 115.25214000000005, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.140205, "r_y0": 118.40410999999995, "r_x1": 93.291527, "r_y1": 118.40410999999995, "r_x2": 93.291527, "r_y2": 115.21489999999994, "r_x3": 82.140205, "r_y3": 115.21489999999994, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 125.62891000000002, "r_x1": 104.3119, "r_y1": 125.62891000000002, "r_x2": 104.3119, "r_y2": 122.43970000000002, "r_x3": 96.748268, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 130.93291999999997, "r_x1": 102.42083, "r_y1": 130.93291999999997, "r_x2": 102.42083, "r_y2": 127.74370999999985, "r_x3": 96.748268, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 136.6449, "r_x1": 104.3119, "r_y1": 136.6449, "r_x2": 104.3119, "r_y2": 133.45569, "r_x3": 96.748268, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 142.35693000000003, "r_x1": 102.42083, "r_y1": 142.35693000000003, "r_x2": 102.42083, "r_y2": 139.16772000000003, "r_x3": 96.748268, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 125.62891000000002, "r_x1": 116.14391, "r_y1": 125.62891000000002, "r_x2": 116.14391, "r_y2": 122.43970000000002, "r_x3": 110.66107, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 130.93291999999997, "r_x1": 116.14391, "r_y1": 130.93291999999997, "r_x2": 116.14391, "r_y2": 127.74370999999985, "r_x3": 110.66107, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 136.6449, "r_x1": 116.14391, "r_y1": 136.6449, "r_x2": 116.14391, "r_y2": 133.45569, "r_x3": 110.66107, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 142.35693000000003, "r_x1": 116.14391, "r_y1": 142.35693000000003, "r_x2": 116.14391, "r_y2": 139.16772000000003, "r_x3": 110.66107, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 130.93291999999997, "r_x1": 84.927567, "r_y1": 130.93291999999997, "r_x2": 84.927567, "r_y2": 127.74370999999985, "r_x3": 81.688072, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 130.93291999999997, "r_x1": 93.026291, "r_y1": 130.93291999999997, "r_x2": 93.026291, "r_y2": 127.74370999999985, "r_x3": 86.54731, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 136.6449, "r_x1": 84.927567, "r_y1": 136.6449, "r_x2": 84.927567, "r_y2": 133.45569, "r_x3": 81.688072, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 136.6449, "r_x1": 93.026291, "r_y1": 136.6449, "r_x2": 93.026291, "r_y2": 133.45569, "r_x3": 86.54731, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 142.35693000000003, "r_x1": 84.927567, "r_y1": 142.35693000000003, "r_x2": 84.927567, "r_y2": 139.16772000000003, "r_x3": 81.688072, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 142.35693000000003, "r_x1": 93.026291, "r_y1": 142.35693000000003, "r_x2": 93.026291, "r_y2": 139.16772000000003, "r_x3": 86.54731, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.084389, "r_y0": 96.23798, "r_x1": 113.93649, "r_y1": 96.23798, "r_x2": 113.93649, "r_y2": 90.49738000000002, "r_x3": 88.084389, "r_y3": 90.49738000000002, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81002, "r_y0": 103.37798999999995, "r_x1": 119.21240000000002, "r_y1": 103.37798999999995, "r_x2": 119.21240000000002, "r_y2": 97.63738999999998, "r_x3": 82.81002, "r_y3": 97.63738999999998, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94247, "r_y0": 106.34295999999995, "r_x1": 180.01131, "r_y1": 106.34295999999995, "r_x2": 180.01131, "r_y2": 100.60235999999998, "r_x3": 143.94247, "r_y3": 100.60235999999998, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94064, "r_y0": 113.48297000000014, "r_x1": 172.0118, "r_y1": 113.48297000000014, "r_x2": 172.0118, "r_y2": 107.74237000000005, "r_x3": 151.94064, "r_y3": 107.74237000000005, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.76939000000002, "r_y0": 86.67156999999997, "r_x1": 266.39557, "r_y1": 86.67156999999997, "r_x2": 266.39557, "r_y2": 80.93096999999989, "r_x3": 251.76939000000002, "r_y3": 80.93096999999989, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 91.77161000000001, "r_x1": 270.65021, "r_y1": 91.77161000000001, "r_x2": 270.65021, "r_y2": 86.03101000000004, "r_x3": 247.51601, "r_y3": 86.03101000000004, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.03699, "r_y0": 84.30042000000003, "r_x1": 352.12589, "r_y1": 84.30042000000003, "r_x2": 352.12589, "r_y2": 78.55980999999997, "r_x3": 331.03699, "r_y3": 78.55980999999997, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56421, "r_y0": 101.77282999999989, "r_x1": 431.7261, "r_y1": 101.77282999999989, "r_x2": 431.7261, "r_y2": 96.03223000000003, "r_x3": 390.56421, "r_y3": 96.03223000000003, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82422, "r_y0": 107.89287999999999, "r_x1": 435.46966999999995, "r_y1": 107.89287999999999, "r_x2": 435.46966999999995, "r_y2": 102.15228000000013, "r_x3": 386.82422, "r_y3": 102.15228000000013, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.69589, "r_y0": 114.01288000000011, "r_x1": 433.6032400000001, "r_y1": 114.01288000000011, "r_x2": 433.6032400000001, "r_y2": 108.27228000000002, "r_x3": 388.69589, "r_y3": 108.27228000000002, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.07761, "r_y0": 120.13286999999991, "r_x1": 431.22542999999996, "r_y1": 120.13286999999991, "r_x2": 431.22542999999996, "r_y2": 114.39227000000005, "r_x3": 391.07761, "r_y3": 114.39227000000005, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.22650000000004, "r_y0": 157.42571999999996, "r_x1": 498.82068, "r_y1": 157.42571999999996, "r_x2": 498.82068, "r_y2": 151.68511999999998, "r_x3": 431.22650000000004, "r_y3": 151.68511999999998, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.1738, "r_y0": 163.54578000000004, "r_x1": 498.87753000000004, "r_y1": 163.54578000000004, "r_x2": 498.87753000000004, "r_y2": 157.80517999999995, "r_x3": 431.1738, "r_y3": 157.80517999999995, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.5289, "r_y0": 169.66576999999995, "r_x1": 489.51827999999995, "r_y1": 169.66576999999995, "r_x2": 489.51827999999995, "r_y2": 163.92516999999998, "r_x3": 440.5289, "r_y3": 163.92516999999998, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37479, "r_y0": 183.99445000000003, "r_x1": 367.72333, "r_y1": 183.99445000000003, "r_x2": 367.72333, "r_y2": 178.25385000000006, "r_x3": 328.37479, "r_y3": 178.25385000000006, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 129.64948000000015, "r_x1": 373.67963, "r_y1": 129.64948000000015, "r_x2": 373.67963, "r_y2": 123.90886999999998, "r_x3": 331.84451, "r_y3": 123.90886999999998, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 134.74945000000002, "r_x1": 381.17786, "r_y1": 134.74945000000002, "r_x2": 381.17786, "r_y2": 129.00885000000017, "r_x3": 331.84451, "r_y3": 129.00885000000017, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.62633, "r_y0": 93.85681, "r_x1": 219.42332, "r_y1": 93.85681, "r_x2": 219.42332, "r_y2": 88.11621000000002, "r_x3": 196.62633, "r_y3": 88.11621000000002, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.66771, "r_y0": 135.23528999999996, "r_x1": 271.49899, "r_y1": 135.23528999999996, "r_x2": 271.49899, "r_y2": 129.4946900000001, "r_x3": 246.66771, "r_y3": 129.4946900000001, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 140.33533, "r_x1": 270.65021, "r_y1": 140.33533, "r_x2": 270.65021, "r_y2": 134.59473000000003, "r_x3": 247.51601, "r_y3": 134.59473000000003, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 94.75982999999997, "r_x1": 365.55347, "r_y1": 94.75982999999997, "r_x2": 365.55347, "r_y2": 89.01923, "r_x3": 330.63071, "r_y3": 89.01923, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 102.91985999999997, "r_x1": 370.22717, "r_y1": 102.91985999999997, "r_x2": 370.22717, "r_y2": 97.17926, "r_x3": 330.63071, "r_y3": 97.17926, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 111.07983000000002, "r_x1": 374.51157, "r_y1": 111.07983000000002, "r_x2": 374.51157, "r_y2": 105.33922999999993, "r_x3": 330.63071, "r_y3": 105.33922999999993, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 119.23987, "r_x1": 335.73233, "r_y1": 119.23987, "r_x2": 335.73233, "r_y2": 113.49926999999991, "r_x3": 330.63071, "r_y3": 113.49926999999991, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 146.57617000000005, "r_x1": 335.05988, "r_y1": 146.57617000000005, "r_x2": 335.05988, "r_y2": 141.79236000000003, "r_x3": 322.30579, "r_y3": 141.79236000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 153.71613000000002, "r_x1": 335.05988, "r_y1": 153.71613000000002, "r_x2": 335.05988, "r_y2": 148.93231000000003, "r_x3": 322.30579, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.54971, "r_y0": 154.29638999999997, "r_x1": 340.95242, "r_y1": 154.29638999999997, "r_x2": 340.95242, "r_y2": 148.55579, "r_x3": 337.54971, "r_y3": 148.55579, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56262, "r_y0": 153.71613000000002, "r_x1": 398.91446, "r_y1": 153.71613000000002, "r_x2": 398.91446, "r_y2": 148.93231000000003, "r_x3": 343.56262, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.41718, "r_y0": 153.71613000000002, "r_x1": 421.58801, "r_y1": 153.71613000000002, "r_x2": 421.58801, "r_y2": 148.93231000000003, "r_x3": 407.41718, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 160.85613999999998, "r_x1": 349.23022, "r_y1": 160.85613999999998, "r_x2": 349.23022, "r_y2": 156.07232999999997, "r_x3": 322.30579, "r_y3": 156.07232999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 167.99614999999994, "r_x1": 335.05988, "r_y1": 167.99614999999994, "r_x2": 335.05988, "r_y2": 163.21234000000004, "r_x3": 322.30579, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56155, "r_y0": 167.99614999999994, "r_x1": 374.73685, "r_y1": 167.99614999999994, "r_x2": 374.73685, "r_y2": 163.21234000000004, "r_x3": 343.56155, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 175.13617, "r_x1": 326.55716, "r_y1": 175.13617, "r_x2": 326.55716, "r_y2": 170.35235999999998, "r_x3": 322.30579, "r_y3": 170.35235999999998, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51111, "r_y0": 95.41027999999994, "r_x1": 326.91382, "r_y1": 95.41027999999994, "r_x2": 326.91382, "r_y2": 89.66967999999997, "r_x3": 323.51111, "r_y3": 89.66967999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 103.52948000000004, "r_x1": 327.1178, "r_y1": 103.52948000000004, "r_x2": 327.1178, "r_y2": 97.78887999999995, "r_x3": 323.71509, "r_y3": 97.78887999999995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 111.73029000000008, "r_x1": 327.1178, "r_y1": 111.73029000000008, "r_x2": 327.1178, "r_y2": 105.98969, "r_x3": 323.71509, "r_y3": 105.98969, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.4816, "r_y0": 154.28687000000002, "r_x1": 404.88431, "r_y1": 154.28687000000002, "r_x2": 404.88431, "r_y2": 148.54625999999996, "r_x3": 401.4816, "r_y3": 148.54625999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.6976, "r_y0": 168.42511000000002, "r_x1": 341.10031, "r_y1": 168.42511000000002, "r_x2": 341.10031, "r_y2": 162.68451000000005, "r_x3": 337.6976, "r_y3": 162.68451000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46378, "r_y0": 110.28644000000008, "r_x1": 457.86648999999994, "r_y1": 110.28644000000008, "r_x2": 457.86648999999994, "r_y2": 104.54584, "r_x3": 454.46378, "r_y3": 104.54584, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.32580999999993, "r_y0": 96.83605999999997, "r_x1": 496.72852, "r_y1": 96.83605999999997, "r_x2": 496.72852, "r_y2": 91.09546, "r_x3": 493.32580999999993, "r_y3": 91.09546, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08298, "r_y0": 96.30939000000001, "r_x1": 457.48569000000003, "r_y1": 96.30939000000001, "r_x2": 457.48569000000003, "r_y2": 90.56879000000015, "r_x3": 454.08298, "r_y3": 90.56879000000015, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 81.688072, "t": 122.43970000000002, "r": 84.927567, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 125.62891000000002, "r_x1": 84.927567, "r_y1": 125.62891000000002, "r_x2": 84.927567, "r_y2": 122.43970000000002, "r_x3": 81.688072, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 86.54731, "t": 122.43970000000002, "r": 93.026291, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 125.62891000000002, "r_x1": 93.026291, "r_y1": 125.62891000000002, "r_x2": 93.026291, "r_y2": 122.43970000000002, "r_x3": 86.54731, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 102.50498, "t": 115.25214000000005, "r": 115.3461, "b": 118.44135000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.50498, "r_y0": 118.44135000000006, "r_x1": 115.3461, "r_y1": 118.44135000000006, "r_x2": 115.3461, "r_y2": 115.25214000000005, "r_x3": 102.50498, "r_y3": 115.25214000000005, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 82.140205, "t": 115.21489999999994, "r": 93.291527, "b": 118.40410999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.140205, "r_y0": 118.40410999999995, "r_x1": 93.291527, "r_y1": 118.40410999999995, "r_x2": 93.291527, "r_y2": 115.21489999999994, "r_x3": 82.140205, "r_y3": 115.21489999999994, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 96.748268, "t": 122.43970000000002, "r": 104.3119, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 125.62891000000002, "r_x1": 104.3119, "r_y1": 125.62891000000002, "r_x2": 104.3119, "r_y2": 122.43970000000002, "r_x3": 96.748268, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 96.748268, "t": 127.74370999999985, "r": 102.42083, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 130.93291999999997, "r_x1": 102.42083, "r_y1": 130.93291999999997, "r_x2": 102.42083, "r_y2": 127.74370999999985, "r_x3": 96.748268, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 96.748268, "t": 133.45569, "r": 104.3119, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 136.6449, "r_x1": 104.3119, "r_y1": 136.6449, "r_x2": 104.3119, "r_y2": 133.45569, "r_x3": 96.748268, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 96.748268, "t": 139.16772000000003, "r": 102.42083, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 142.35693000000003, "r_x1": 102.42083, "r_y1": 142.35693000000003, "r_x2": 102.42083, "r_y2": 139.16772000000003, "r_x3": 96.748268, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 110.66107, "t": 122.43970000000002, "r": 116.14391, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 125.62891000000002, "r_x1": 116.14391, "r_y1": 125.62891000000002, "r_x2": 116.14391, "r_y2": 122.43970000000002, "r_x3": 110.66107, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 110.66107, "t": 127.74370999999985, "r": 116.14391, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 130.93291999999997, "r_x1": 116.14391, "r_y1": 130.93291999999997, "r_x2": 116.14391, "r_y2": 127.74370999999985, "r_x3": 110.66107, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 110.66107, "t": 133.45569, "r": 116.14391, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 136.6449, "r_x1": 116.14391, "r_y1": 136.6449, "r_x2": 116.14391, "r_y2": 133.45569, "r_x3": 110.66107, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 110.66107, "t": 139.16772000000003, "r": 116.14391, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 142.35693000000003, "r_x1": 116.14391, "r_y1": 142.35693000000003, "r_x2": 116.14391, "r_y2": 139.16772000000003, "r_x3": 110.66107, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 81.688072, "t": 127.74370999999985, "r": 84.927567, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 130.93291999999997, "r_x1": 84.927567, "r_y1": 130.93291999999997, "r_x2": 84.927567, "r_y2": 127.74370999999985, "r_x3": 81.688072, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 86.54731, "t": 127.74370999999985, "r": 93.026291, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 130.93291999999997, "r_x1": 93.026291, "r_y1": 130.93291999999997, "r_x2": 93.026291, "r_y2": 127.74370999999985, "r_x3": 86.54731, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 81.688072, "t": 133.45569, "r": 84.927567, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 136.6449, "r_x1": 84.927567, "r_y1": 136.6449, "r_x2": 84.927567, "r_y2": 133.45569, "r_x3": 81.688072, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 86.54731, "t": 133.45569, "r": 93.026291, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 136.6449, "r_x1": 93.026291, "r_y1": 136.6449, "r_x2": 93.026291, "r_y2": 133.45569, "r_x3": 86.54731, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 81.688072, "t": 139.16772000000003, "r": 84.927567, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 142.35693000000003, "r_x1": 84.927567, "r_y1": 142.35693000000003, "r_x2": 84.927567, "r_y2": 139.16772000000003, "r_x3": 81.688072, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 86.54731, "t": 139.16772000000003, "r": 93.026291, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 142.35693000000003, "r_x1": 93.026291, "r_y1": 142.35693000000003, "r_x2": 93.026291, "r_y2": 139.16772000000003, "r_x3": 86.54731, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 88.084389, "t": 90.49738000000002, "r": 113.93649, "b": 96.23798, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.084389, "r_y0": 96.23798, "r_x1": 113.93649, "r_y1": 96.23798, "r_x2": 113.93649, "r_y2": 90.49738000000002, "r_x3": 88.084389, "r_y3": 90.49738000000002, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 82.81002, "t": 97.63738999999998, "r": 119.21240000000002, "b": 103.37798999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81002, "r_y0": 103.37798999999995, "r_x1": 119.21240000000002, "r_y1": 103.37798999999995, "r_x2": 119.21240000000002, "r_y2": 97.63738999999998, "r_x3": 82.81002, "r_y3": 97.63738999999998, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 143.94247, "t": 100.60235999999998, "r": 180.01131, "b": 106.34295999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94247, "r_y0": 106.34295999999995, "r_x1": 180.01131, "r_y1": 106.34295999999995, "r_x2": 180.01131, "r_y2": 100.60235999999998, "r_x3": 143.94247, "r_y3": 100.60235999999998, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 151.94064, "t": 107.74237000000005, "r": 172.0118, "b": 113.48297000000014, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94064, "r_y0": 113.48297000000014, "r_x1": 172.0118, "r_y1": 113.48297000000014, "r_x2": 172.0118, "r_y2": 107.74237000000005, "r_x3": 151.94064, "r_y3": 107.74237000000005, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 251.76939000000002, "t": 80.93096999999989, "r": 266.39557, "b": 86.67156999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.76939000000002, "r_y0": 86.67156999999997, "r_x1": 266.39557, "r_y1": 86.67156999999997, "r_x2": 266.39557, "r_y2": 80.93096999999989, "r_x3": 251.76939000000002, "r_y3": 80.93096999999989, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 247.51601, "t": 86.03101000000004, "r": 270.65021, "b": 91.77161000000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 91.77161000000001, "r_x1": 270.65021, "r_y1": 91.77161000000001, "r_x2": 270.65021, "r_y2": 86.03101000000004, "r_x3": 247.51601, "r_y3": 86.03101000000004, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 331.03699, "t": 78.55980999999997, "r": 352.12589, "b": 84.30042000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.03699, "r_y0": 84.30042000000003, "r_x1": 352.12589, "r_y1": 84.30042000000003, "r_x2": 352.12589, "r_y2": 78.55980999999997, "r_x3": 331.03699, "r_y3": 78.55980999999997, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 390.56421, "t": 96.03223000000003, "r": 431.7261, "b": 101.77282999999989, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56421, "r_y0": 101.77282999999989, "r_x1": 431.7261, "r_y1": 101.77282999999989, "r_x2": 431.7261, "r_y2": 96.03223000000003, "r_x3": 390.56421, "r_y3": 96.03223000000003, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 386.82422, "t": 102.15228000000013, "r": 435.46966999999995, "b": 107.89287999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82422, "r_y0": 107.89287999999999, "r_x1": 435.46966999999995, "r_y1": 107.89287999999999, "r_x2": 435.46966999999995, "r_y2": 102.15228000000013, "r_x3": 386.82422, "r_y3": 102.15228000000013, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 388.69589, "t": 108.27228000000002, "r": 433.6032400000001, "b": 114.01288000000011, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.69589, "r_y0": 114.01288000000011, "r_x1": 433.6032400000001, "r_y1": 114.01288000000011, "r_x2": 433.6032400000001, "r_y2": 108.27228000000002, "r_x3": 388.69589, "r_y3": 108.27228000000002, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 391.07761, "t": 114.39227000000005, "r": 431.22542999999996, "b": 120.13286999999991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.07761, "r_y0": 120.13286999999991, "r_x1": 431.22542999999996, "r_y1": 120.13286999999991, "r_x2": 431.22542999999996, "r_y2": 114.39227000000005, "r_x3": 391.07761, "r_y3": 114.39227000000005, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 431.22650000000004, "t": 151.68511999999998, "r": 498.82068, "b": 157.42571999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.22650000000004, "r_y0": 157.42571999999996, "r_x1": 498.82068, "r_y1": 157.42571999999996, "r_x2": 498.82068, "r_y2": 151.68511999999998, "r_x3": 431.22650000000004, "r_y3": 151.68511999999998, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 431.1738, "t": 157.80517999999995, "r": 498.87753000000004, "b": 163.54578000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.1738, "r_y0": 163.54578000000004, "r_x1": 498.87753000000004, "r_y1": 163.54578000000004, "r_x2": 498.87753000000004, "r_y2": 157.80517999999995, "r_x3": 431.1738, "r_y3": 157.80517999999995, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 440.5289, "t": 163.92516999999998, "r": 489.51827999999995, "b": 169.66576999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.5289, "r_y0": 169.66576999999995, "r_x1": 489.51827999999995, "r_y1": 169.66576999999995, "r_x2": 489.51827999999995, "r_y2": 163.92516999999998, "r_x3": 440.5289, "r_y3": 163.92516999999998, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 328.37479, "t": 178.25385000000006, "r": 367.72333, "b": 183.99445000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37479, "r_y0": 183.99445000000003, "r_x1": 367.72333, "r_y1": 183.99445000000003, "r_x2": 367.72333, "r_y2": 178.25385000000006, "r_x3": 328.37479, "r_y3": 178.25385000000006, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 331.84451, "t": 123.90886999999998, "r": 373.67963, "b": 129.64948000000015, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 129.64948000000015, "r_x1": 373.67963, "r_y1": 129.64948000000015, "r_x2": 373.67963, "r_y2": 123.90886999999998, "r_x3": 331.84451, "r_y3": 123.90886999999998, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 331.84451, "t": 129.00885000000017, "r": 381.17786, "b": 134.74945000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 134.74945000000002, "r_x1": 381.17786, "r_y1": 134.74945000000002, "r_x2": 381.17786, "r_y2": 129.00885000000017, "r_x3": 331.84451, "r_y3": 129.00885000000017, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 196.62633, "t": 88.11621000000002, "r": 219.42332, "b": 93.85681, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.62633, "r_y0": 93.85681, "r_x1": 219.42332, "r_y1": 93.85681, "r_x2": 219.42332, "r_y2": 88.11621000000002, "r_x3": 196.62633, "r_y3": 88.11621000000002, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 246.66771, "t": 129.4946900000001, "r": 271.49899, "b": 135.23528999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.66771, "r_y0": 135.23528999999996, "r_x1": 271.49899, "r_y1": 135.23528999999996, "r_x2": 271.49899, "r_y2": 129.4946900000001, "r_x3": 246.66771, "r_y3": 129.4946900000001, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 247.51601, "t": 134.59473000000003, "r": 270.65021, "b": 140.33533, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 140.33533, "r_x1": 270.65021, "r_y1": 140.33533, "r_x2": 270.65021, "r_y2": 134.59473000000003, "r_x3": 247.51601, "r_y3": 134.59473000000003, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 330.63071, "t": 89.01923, "r": 365.55347, "b": 94.75982999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 94.75982999999997, "r_x1": 365.55347, "r_y1": 94.75982999999997, "r_x2": 365.55347, "r_y2": 89.01923, "r_x3": 330.63071, "r_y3": 89.01923, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 330.63071, "t": 97.17926, "r": 370.22717, "b": 102.91985999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 102.91985999999997, "r_x1": 370.22717, "r_y1": 102.91985999999997, "r_x2": 370.22717, "r_y2": 97.17926, "r_x3": 330.63071, "r_y3": 97.17926, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 330.63071, "t": 105.33922999999993, "r": 374.51157, "b": 111.07983000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 111.07983000000002, "r_x1": 374.51157, "r_y1": 111.07983000000002, "r_x2": 374.51157, "r_y2": 105.33922999999993, "r_x3": 330.63071, "r_y3": 105.33922999999993, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 330.63071, "t": 113.49926999999991, "r": 335.73233, "b": 119.23987, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 119.23987, "r_x1": 335.73233, "r_y1": 119.23987, "r_x2": 335.73233, "r_y2": 113.49926999999991, "r_x3": 330.63071, "r_y3": 113.49926999999991, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 322.30579, "t": 141.79236000000003, "r": 335.05988, "b": 146.57617000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 146.57617000000005, "r_x1": 335.05988, "r_y1": 146.57617000000005, "r_x2": 335.05988, "r_y2": 141.79236000000003, "r_x3": 322.30579, "r_y3": 141.79236000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 322.30579, "t": 148.93231000000003, "r": 335.05988, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 153.71613000000002, "r_x1": 335.05988, "r_y1": 153.71613000000002, "r_x2": 335.05988, "r_y2": 148.93231000000003, "r_x3": 322.30579, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 337.54971, "t": 148.55579, "r": 340.95242, "b": 154.29638999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.54971, "r_y0": 154.29638999999997, "r_x1": 340.95242, "r_y1": 154.29638999999997, "r_x2": 340.95242, "r_y2": 148.55579, "r_x3": 337.54971, "r_y3": 148.55579, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 343.56262, "t": 148.93231000000003, "r": 398.91446, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56262, "r_y0": 153.71613000000002, "r_x1": 398.91446, "r_y1": 153.71613000000002, "r_x2": 398.91446, "r_y2": 148.93231000000003, "r_x3": 343.56262, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 407.41718, "t": 148.93231000000003, "r": 421.58801, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.41718, "r_y0": 153.71613000000002, "r_x1": 421.58801, "r_y1": 153.71613000000002, "r_x2": 421.58801, "r_y2": 148.93231000000003, "r_x3": 407.41718, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 322.30579, "t": 156.07232999999997, "r": 349.23022, "b": 160.85613999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 160.85613999999998, "r_x1": 349.23022, "r_y1": 160.85613999999998, "r_x2": 349.23022, "r_y2": 156.07232999999997, "r_x3": 322.30579, "r_y3": 156.07232999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 322.30579, "t": 163.21234000000004, "r": 335.05988, "b": 167.99614999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 167.99614999999994, "r_x1": 335.05988, "r_y1": 167.99614999999994, "r_x2": 335.05988, "r_y2": 163.21234000000004, "r_x3": 322.30579, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 343.56155, "t": 163.21234000000004, "r": 374.73685, "b": 167.99614999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56155, "r_y0": 167.99614999999994, "r_x1": 374.73685, "r_y1": 167.99614999999994, "r_x2": 374.73685, "r_y2": 163.21234000000004, "r_x3": 343.56155, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 322.30579, "t": 170.35235999999998, "r": 326.55716, "b": 175.13617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 175.13617, "r_x1": 326.55716, "r_y1": 175.13617, "r_x2": 326.55716, "r_y2": 170.35235999999998, "r_x3": 322.30579, "r_y3": 170.35235999999998, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 323.51111, "t": 89.66967999999997, "r": 326.91382, "b": 95.41027999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51111, "r_y0": 95.41027999999994, "r_x1": 326.91382, "r_y1": 95.41027999999994, "r_x2": 326.91382, "r_y2": 89.66967999999997, "r_x3": 323.51111, "r_y3": 89.66967999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 323.71509, "t": 97.78887999999995, "r": 327.1178, "b": 103.52948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 103.52948000000004, "r_x1": 327.1178, "r_y1": 103.52948000000004, "r_x2": 327.1178, "r_y2": 97.78887999999995, "r_x3": 323.71509, "r_y3": 97.78887999999995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 323.71509, "t": 105.98969, "r": 327.1178, "b": 111.73029000000008, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 111.73029000000008, "r_x1": 327.1178, "r_y1": 111.73029000000008, "r_x2": 327.1178, "r_y2": 105.98969, "r_x3": 323.71509, "r_y3": 105.98969, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 401.4816, "t": 148.54625999999996, "r": 404.88431, "b": 154.28687000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.4816, "r_y0": 154.28687000000002, "r_x1": 404.88431, "r_y1": 154.28687000000002, "r_x2": 404.88431, "r_y2": 148.54625999999996, "r_x3": 401.4816, "r_y3": 148.54625999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 337.6976, "t": 162.68451000000005, "r": 341.10031, "b": 168.42511000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.6976, "r_y0": 168.42511000000002, "r_x1": 341.10031, "r_y1": 168.42511000000002, "r_x2": 341.10031, "r_y2": 162.68451000000005, "r_x3": 337.6976, "r_y3": 162.68451000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 454.46378, "t": 104.54584, "r": 457.86648999999994, "b": 110.28644000000008, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46378, "r_y0": 110.28644000000008, "r_x1": 457.86648999999994, "r_y1": 110.28644000000008, "r_x2": 457.86648999999994, "r_y2": 104.54584, "r_x3": 454.46378, "r_y3": 104.54584, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 493.32580999999993, "t": 91.09546, "r": 496.72852, "b": 96.83605999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.32580999999993, "r_y0": 96.83605999999997, "r_x1": 496.72852, "r_y1": 96.83605999999997, "r_x2": 496.72852, "r_y2": 91.09546, "r_x3": 493.32580999999993, "r_y3": 91.09546, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 454.08298, "t": 90.56879000000015, "r": 457.48569000000003, "b": 96.30939000000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08298, "r_y0": 96.30939000000001, "r_x1": 457.48569000000003, "r_y1": 96.30939000000001, "r_x2": 457.48569000000003, "r_y2": 90.56879000000015, "r_x3": 454.08298, "r_y3": 90.56879000000015, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 6, "label": "caption", "bbox": { "l": 50.111992, "t": 203.98577999999998, "r": 545.10846, "b": 224.96691999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9677652716636658, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 213.01189999999997, "r_x1": 86.883949, "r_y1": 213.01189999999997, "r_x2": 86.883949, "r_y2": 204.10535000000004, "r_x3": 50.112, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.020996, "r_y0": 212.94214, "r_x1": 149.85141, "r_y1": 212.94214, "r_x2": 149.85141, "r_y2": 203.98577999999998, "r_x3": 94.020996, "r_y3": 203.98577999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86099, "r_y0": 213.01189999999997, "r_x1": 545.10846, "r_y1": 213.01189999999997, "r_x2": 545.10846, "r_y2": 204.10535000000004, "r_x3": 152.86099, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 224.96691999999996, "r_x1": 436.0134, "r_y1": 224.96691999999996, "r_x2": 436.0134, "r_y2": 216.06035999999995, "r_x3": 50.111992, "r_y3": 216.06035999999995, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "picture", "bbox": { "l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT" }, "confidence": 0.9724942445755005, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.253464, "r_y0": 264.17474000000004, "r_x1": 101.75846, "r_y1": 264.17474000000004, "r_x2": 101.75846, "r_y2": 258.21472000000006, "r_x3": 74.253464, "r_y3": 258.21472000000006, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.29972, "r_y0": 264.30524, "r_x1": 157.83972, "r_y1": 264.30524, "r_x2": 157.83972, "r_y2": 258.34520999999995, "r_x3": 122.29972, "r_y3": 258.34520999999995, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.549347, "r_y0": 377.04782, "r_x1": 125.68359000000001, "r_y1": 377.04782, "r_x2": 125.68359000000001, "r_y2": 371.38579999999996, "r_x3": 78.549347, "r_y3": 371.38579999999996, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.513298, "r_y0": 396.98059, "r_x1": 84.644547, "r_y1": 396.98059, "r_x2": 84.644547, "r_y2": 391.31857, "r_x3": 78.513298, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.52705, "r_y0": 396.98059, "r_x1": 125.11079999999998, "r_y1": 396.98059, "r_x2": 125.11079999999998, "r_y2": 391.31857, "r_x3": 116.52705, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.024773, "r_y0": 430.11511, "r_x1": 127.92327000000002, "r_y1": 430.11511, "r_x2": 127.92327000000002, "r_y2": 424.45309, "r_x3": 76.024773, "r_y3": 424.45309, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.382828, "r_y0": 450.55157, "r_x1": 84.514076, "r_y1": 450.55157, "r_x2": 84.514076, "r_y2": 444.88956, "r_x3": 78.382828, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.39658, "r_y0": 450.55157, "r_x1": 124.98033, "r_y1": 450.55157, "r_x2": 124.98033, "r_y2": 444.88956, "r_x3": 116.39658, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.46945, "r_y0": 468.10526, "r_x1": 181.6292, "r_y1": 468.10526, "r_x2": 181.6292, "r_y2": 462.44324, "r_x3": 167.46945, "r_y3": 462.44324, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61292, "r_y0": 484.13309, "r_x1": 184.43242, "r_y1": 484.13309, "r_x2": 184.43242, "r_y2": 478.47107, "r_x3": 165.61292, "r_y3": 478.47107, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.319511, "r_y0": 330.22235000000006, "r_x1": 132.9245, "r_y1": 330.22235000000006, "r_x2": 132.9245, "r_y2": 324.26235999999994, "r_x3": 65.319511, "r_y3": 324.26235999999994, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51457, "r_y0": 274.72992, "r_x1": 162.98782, "r_y1": 274.72992, "r_x2": 162.98782, "r_y2": 269.66394, "r_x3": 119.51457, "r_y3": 269.66394, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.72858, "r_y0": 279.97992, "r_x1": 151.41083, "r_y1": 279.97992, "r_x2": 151.41083, "r_y2": 274.91394, "r_x3": 128.72858, "r_y3": 274.91394, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.434211999999995, "r_y0": 344.26993, "r_x1": 80.27021, "r_y1": 344.26993, "r_x2": 80.27021, "r_y2": 338.95993, "r_x3": 60.434211999999995, "r_y3": 338.95993, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.598457, "r_y0": 348.69604, "r_x1": 78.854958, "r_y1": 348.69604, "r_x2": 78.854958, "r_y2": 343.38605, "r_x3": 60.598457, "r_y3": 343.38605, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.82877, "r_y0": 298.68762, "r_x1": 154.66476, "r_y1": 298.68762, "r_x2": 154.66476, "r_y2": 293.37762, "r_x3": 134.82877, "r_y3": 293.37762, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99303, "r_y0": 303.11371, "r_x1": 153.24953, "r_y1": 303.11371, "r_x2": 153.24953, "r_y2": 297.80370999999997, "r_x3": 134.99303, "r_y3": 297.80370999999997, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 351.02063, "r_x1": 197.14943, "r_y1": 351.02063, "r_x2": 197.14943, "r_y2": 345.35861, "r_x3": 150.55193, "r_y3": 345.35861, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 400.08542, "r_x1": 156.68318, "r_y1": 400.08542, "r_x2": 156.68318, "r_y2": 394.4234, "r_x3": 150.55193, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 400.08542, "r_x1": 197.14943, "r_y1": 400.08542, "r_x2": 197.14943, "r_y2": 394.4234, "r_x3": 188.56567, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.18539, "r_y0": 381.33044, "r_x1": 197.31964, "r_y1": 381.33044, "r_x2": 197.31964, "r_y2": 375.66843, "r_x3": 150.18539, "r_y3": 375.66843, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 445.91049, "r_x1": 156.68318, "r_y1": 445.91049, "r_x2": 156.68318, "r_y2": 440.24847000000005, "r_x3": 150.55193, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 445.91049, "r_x1": 197.14943, "r_y1": 445.91049, "r_x2": 197.14943, "r_y2": 440.24847000000005, "r_x3": 188.56567, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86377, "r_y0": 427.75537, "r_x1": 199.76227, "r_y1": 427.75537, "r_x2": 199.76227, "r_y2": 422.09335, "r_x3": 147.86377, "r_y3": 422.09335, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.56567000000004, "r_y0": 319.92487, "r_x1": 255.72542, "r_y1": 319.92487, "r_x2": 255.72542, "r_y2": 314.26285000000007, "r_x3": 241.56567000000004, "r_y3": 314.26285000000007, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.91730000000004, "r_y0": 367.02695, "r_x1": 256.07706, "r_y1": 367.02695, "r_x2": 256.07706, "r_y2": 361.36493, "r_x3": 241.91730000000004, "r_y3": 361.36493, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.054, "r_y0": 342.28131, "r_x1": 248.72363000000004, "r_y1": 342.28131, "r_x2": 248.72363000000004, "r_y2": 336.61929000000003, "r_x3": 228.054, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.2919, "r_y0": 342.28131, "r_x1": 269.39325, "r_y1": 342.28131, "r_x2": 269.39325, "r_y2": 336.61929000000003, "r_x3": 246.2919, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.44568000000004, "r_y0": 410.80884, "r_x1": 238.73892, "r_y1": 410.80884, "r_x2": 238.73892, "r_y2": 405.14682, "r_x3": 228.44568000000004, "r_y3": 405.14682, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.29767, "r_y0": 410.86526, "r_x1": 271.77792, "r_y1": 410.86526, "r_x2": 271.77792, "r_y2": 405.2032500000001, "r_x3": 256.29767, "r_y3": 405.2032500000001, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.54543, "r_y0": 387.87546, "r_x1": 258.08942, "r_y1": 387.87546, "r_x2": 258.08942, "r_y2": 382.21344, "r_x3": 239.54543, "r_y3": 382.21344, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.14704100000001, "r_y0": 449.78326, "r_x1": 59.51152, "r_y1": 449.78326, "r_x2": 59.51152, "r_y2": 384.87183, "r_x3": 54.14704100000001, "r_y3": 384.87183, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.235424, "r_y0": 378.45421999999996, "r_x1": 59.30449699999999, "r_y1": 378.45421999999996, "r_x2": 59.30449699999999, "r_y2": 373.81232, "r_x3": 54.235424, "r_y3": 373.81232, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.295891, "r_y0": 490.36688, "r_x1": 122.16431, "r_y1": 490.36688, "r_x2": 122.16431, "r_y2": 484.53189, "r_x3": 85.295891, "r_y3": 484.53189, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.66599, "r_y0": 285.45572000000004, "r_x1": 265.3194, "r_y1": 285.45572000000004, "r_x2": 265.3194, "r_y2": 279.54607999999996, "r_x3": 229.66599, "r_y3": 279.54607999999996, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17369, "r_y0": 506.12943, "r_x1": 190.41711, "r_y1": 506.12943, "r_x2": 190.41711, "r_y2": 500.3031, "r_x3": 157.17369, "r_y3": 500.3031, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.81598999999997, "r_y0": 443.89206, "r_x1": 270.78442, "r_y1": 443.89206, "r_x2": 270.78442, "r_y2": 438.05542, "r_x3": 227.81598999999997, "r_y3": 438.05542, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.70262, "r_y0": 449.8904999999999, "r_x1": 263.51105, "r_y1": 449.8904999999999, "r_x2": 263.51105, "r_y2": 444.06183, "r_x3": 233.70262, "r_y3": 444.06183, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.74655, "r_y0": 298.75903, "r_x1": 212.16055, "r_y1": 298.75903, "r_x2": 212.16055, "r_y2": 293.39502, "r_x3": 184.74655, "r_y3": 293.39502, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91229, "r_y0": 304.50903, "r_x1": 216.74378999999996, "r_y1": 304.50903, "r_x2": 216.74378999999996, "r_y2": 299.14502, "r_x3": 178.91229, "r_y3": 299.14502, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.24574, "r_y0": 287.84817999999996, "r_x1": 198.89099, "r_y1": 287.84817999999996, "r_x2": 198.89099, "r_y2": 282.7822, "r_x3": 194.24574, "r_y3": 282.7822, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.45587, "r_y0": 277.82916, "r_x1": 276.47089, "r_y1": 277.82916, "r_x2": 276.47089, "r_y2": 271.86914, "r_x3": 221.45587, "r_y3": 271.86914, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65219, "r_y0": 329.10443, "r_x1": 197.29019, "r_y1": 329.10443, "r_x2": 197.29019, "r_y2": 323.44241, "r_x3": 151.65219, "r_y3": 323.44241, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43277, "r_y0": 335.10443, "r_x1": 184.19028, "r_y1": 335.10443, "r_x2": 184.19028, "r_y2": 329.44241, "r_x3": 163.43277, "r_y3": 329.44241, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 70, "label": "text", "bbox": { "l": 74.253464, "t": 258.21472000000006, "r": 101.75846, "b": 264.17474000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.253464, "r_y0": 264.17474000000004, "r_x1": 101.75846, "r_y1": 264.17474000000004, "r_x2": 101.75846, "r_y2": 258.21472000000006, "r_x3": 74.253464, "r_y3": 258.21472000000006, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 122.29972, "t": 258.34520999999995, "r": 157.83972, "b": 264.30524, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.29972, "r_y0": 264.30524, "r_x1": 157.83972, "r_y1": 264.30524, "r_x2": 157.83972, "r_y2": 258.34520999999995, "r_x3": 122.29972, "r_y3": 258.34520999999995, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 78.549347, "t": 371.38579999999996, "r": 125.68359000000001, "b": 377.04782, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.549347, "r_y0": 377.04782, "r_x1": 125.68359000000001, "r_y1": 377.04782, "r_x2": 125.68359000000001, "r_y2": 371.38579999999996, "r_x3": 78.549347, "r_y3": 371.38579999999996, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 78.513298, "t": 391.31857, "r": 84.644547, "b": 396.98059, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.513298, "r_y0": 396.98059, "r_x1": 84.644547, "r_y1": 396.98059, "r_x2": 84.644547, "r_y2": 391.31857, "r_x3": 78.513298, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 116.52705, "t": 391.31857, "r": 125.11079999999998, "b": 396.98059, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.52705, "r_y0": 396.98059, "r_x1": 125.11079999999998, "r_y1": 396.98059, "r_x2": 125.11079999999998, "r_y2": 391.31857, "r_x3": 116.52705, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 76.024773, "t": 424.45309, "r": 127.92327000000002, "b": 430.11511, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.024773, "r_y0": 430.11511, "r_x1": 127.92327000000002, "r_y1": 430.11511, "r_x2": 127.92327000000002, "r_y2": 424.45309, "r_x3": 76.024773, "r_y3": 424.45309, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 78.382828, "t": 444.88956, "r": 84.514076, "b": 450.55157, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.382828, "r_y0": 450.55157, "r_x1": 84.514076, "r_y1": 450.55157, "r_x2": 84.514076, "r_y2": 444.88956, "r_x3": 78.382828, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 116.39658, "t": 444.88956, "r": 124.98033, "b": 450.55157, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.39658, "r_y0": 450.55157, "r_x1": 124.98033, "r_y1": 450.55157, "r_x2": 124.98033, "r_y2": 444.88956, "r_x3": 116.39658, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 167.46945, "t": 462.44324, "r": 181.6292, "b": 468.10526, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.46945, "r_y0": 468.10526, "r_x1": 181.6292, "r_y1": 468.10526, "r_x2": 181.6292, "r_y2": 462.44324, "r_x3": 167.46945, "r_y3": 462.44324, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 165.61292, "t": 478.47107, "r": 184.43242, "b": 484.13309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61292, "r_y0": 484.13309, "r_x1": 184.43242, "r_y1": 484.13309, "r_x2": 184.43242, "r_y2": 478.47107, "r_x3": 165.61292, "r_y3": 478.47107, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 65.319511, "t": 324.26235999999994, "r": 132.9245, "b": 330.22235000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.319511, "r_y0": 330.22235000000006, "r_x1": 132.9245, "r_y1": 330.22235000000006, "r_x2": 132.9245, "r_y2": 324.26235999999994, "r_x3": 65.319511, "r_y3": 324.26235999999994, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 119.51457, "t": 269.66394, "r": 162.98782, "b": 274.72992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51457, "r_y0": 274.72992, "r_x1": 162.98782, "r_y1": 274.72992, "r_x2": 162.98782, "r_y2": 269.66394, "r_x3": 119.51457, "r_y3": 269.66394, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 128.72858, "t": 274.91394, "r": 151.41083, "b": 279.97992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.72858, "r_y0": 279.97992, "r_x1": 151.41083, "r_y1": 279.97992, "r_x2": 151.41083, "r_y2": 274.91394, "r_x3": 128.72858, "r_y3": 274.91394, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 60.434211999999995, "t": 338.95993, "r": 80.27021, "b": 344.26993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.434211999999995, "r_y0": 344.26993, "r_x1": 80.27021, "r_y1": 344.26993, "r_x2": 80.27021, "r_y2": 338.95993, "r_x3": 60.434211999999995, "r_y3": 338.95993, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 60.598457, "t": 343.38605, "r": 78.854958, "b": 348.69604, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.598457, "r_y0": 348.69604, "r_x1": 78.854958, "r_y1": 348.69604, "r_x2": 78.854958, "r_y2": 343.38605, "r_x3": 60.598457, "r_y3": 343.38605, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 134.82877, "t": 293.37762, "r": 154.66476, "b": 298.68762, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.82877, "r_y0": 298.68762, "r_x1": 154.66476, "r_y1": 298.68762, "r_x2": 154.66476, "r_y2": 293.37762, "r_x3": 134.82877, "r_y3": 293.37762, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 134.99303, "t": 297.80370999999997, "r": 153.24953, "b": 303.11371, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99303, "r_y0": 303.11371, "r_x1": 153.24953, "r_y1": 303.11371, "r_x2": 153.24953, "r_y2": 297.80370999999997, "r_x3": 134.99303, "r_y3": 297.80370999999997, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 150.55193, "t": 345.35861, "r": 197.14943, "b": 351.02063, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 351.02063, "r_x1": 197.14943, "r_y1": 351.02063, "r_x2": 197.14943, "r_y2": 345.35861, "r_x3": 150.55193, "r_y3": 345.35861, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 150.55193, "t": 394.4234, "r": 156.68318, "b": 400.08542, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 400.08542, "r_x1": 156.68318, "r_y1": 400.08542, "r_x2": 156.68318, "r_y2": 394.4234, "r_x3": 150.55193, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 188.56567, "t": 394.4234, "r": 197.14943, "b": 400.08542, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 400.08542, "r_x1": 197.14943, "r_y1": 400.08542, "r_x2": 197.14943, "r_y2": 394.4234, "r_x3": 188.56567, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 150.18539, "t": 375.66843, "r": 197.31964, "b": 381.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.18539, "r_y0": 381.33044, "r_x1": 197.31964, "r_y1": 381.33044, "r_x2": 197.31964, "r_y2": 375.66843, "r_x3": 150.18539, "r_y3": 375.66843, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 150.55193, "t": 440.24847000000005, "r": 156.68318, "b": 445.91049, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 445.91049, "r_x1": 156.68318, "r_y1": 445.91049, "r_x2": 156.68318, "r_y2": 440.24847000000005, "r_x3": 150.55193, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 188.56567, "t": 440.24847000000005, "r": 197.14943, "b": 445.91049, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 445.91049, "r_x1": 197.14943, "r_y1": 445.91049, "r_x2": 197.14943, "r_y2": 440.24847000000005, "r_x3": 188.56567, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 147.86377, "t": 422.09335, "r": 199.76227, "b": 427.75537, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86377, "r_y0": 427.75537, "r_x1": 199.76227, "r_y1": 427.75537, "r_x2": 199.76227, "r_y2": 422.09335, "r_x3": 147.86377, "r_y3": 422.09335, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 241.56567000000004, "t": 314.26285000000007, "r": 255.72542, "b": 319.92487, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.56567000000004, "r_y0": 319.92487, "r_x1": 255.72542, "r_y1": 319.92487, "r_x2": 255.72542, "r_y2": 314.26285000000007, "r_x3": 241.56567000000004, "r_y3": 314.26285000000007, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 241.91730000000004, "t": 361.36493, "r": 256.07706, "b": 367.02695, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.91730000000004, "r_y0": 367.02695, "r_x1": 256.07706, "r_y1": 367.02695, "r_x2": 256.07706, "r_y2": 361.36493, "r_x3": 241.91730000000004, "r_y3": 361.36493, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 228.054, "t": 336.61929000000003, "r": 248.72363000000004, "b": 342.28131, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.054, "r_y0": 342.28131, "r_x1": 248.72363000000004, "r_y1": 342.28131, "r_x2": 248.72363000000004, "r_y2": 336.61929000000003, "r_x3": 228.054, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 246.2919, "t": 336.61929000000003, "r": 269.39325, "b": 342.28131, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.2919, "r_y0": 342.28131, "r_x1": 269.39325, "r_y1": 342.28131, "r_x2": 269.39325, "r_y2": 336.61929000000003, "r_x3": 246.2919, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 228.44568000000004, "t": 405.14682, "r": 238.73892, "b": 410.80884, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.44568000000004, "r_y0": 410.80884, "r_x1": 238.73892, "r_y1": 410.80884, "r_x2": 238.73892, "r_y2": 405.14682, "r_x3": 228.44568000000004, "r_y3": 405.14682, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 256.29767, "t": 405.2032500000001, "r": 271.77792, "b": 410.86526, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.29767, "r_y0": 410.86526, "r_x1": 271.77792, "r_y1": 410.86526, "r_x2": 271.77792, "r_y2": 405.2032500000001, "r_x3": 256.29767, "r_y3": 405.2032500000001, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 239.54543, "t": 382.21344, "r": 258.08942, "b": 387.87546, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.54543, "r_y0": 387.87546, "r_x1": 258.08942, "r_y1": 387.87546, "r_x2": 258.08942, "r_y2": 382.21344, "r_x3": 239.54543, "r_y3": 382.21344, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 54.14704100000001, "t": 384.87183, "r": 59.51152, "b": 449.78326, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.14704100000001, "r_y0": 449.78326, "r_x1": 59.51152, "r_y1": 449.78326, "r_x2": 59.51152, "r_y2": 384.87183, "r_x3": 54.14704100000001, "r_y3": 384.87183, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 54.235424, "t": 373.81232, "r": 59.30449699999999, "b": 378.45421999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.235424, "r_y0": 378.45421999999996, "r_x1": 59.30449699999999, "r_y1": 378.45421999999996, "r_x2": 59.30449699999999, "r_y2": 373.81232, "r_x3": 54.235424, "r_y3": 373.81232, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 85.295891, "t": 484.53189, "r": 122.16431, "b": 490.36688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.295891, "r_y0": 490.36688, "r_x1": 122.16431, "r_y1": 490.36688, "r_x2": 122.16431, "r_y2": 484.53189, "r_x3": 85.295891, "r_y3": 484.53189, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 229.66599, "t": 279.54607999999996, "r": 265.3194, "b": 285.45572000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.66599, "r_y0": 285.45572000000004, "r_x1": 265.3194, "r_y1": 285.45572000000004, "r_x2": 265.3194, "r_y2": 279.54607999999996, "r_x3": 229.66599, "r_y3": 279.54607999999996, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 157.17369, "t": 500.3031, "r": 190.41711, "b": 506.12943, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17369, "r_y0": 506.12943, "r_x1": 190.41711, "r_y1": 506.12943, "r_x2": 190.41711, "r_y2": 500.3031, "r_x3": 157.17369, "r_y3": 500.3031, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 227.81598999999997, "t": 438.05542, "r": 270.78442, "b": 443.89206, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.81598999999997, "r_y0": 443.89206, "r_x1": 270.78442, "r_y1": 443.89206, "r_x2": 270.78442, "r_y2": 438.05542, "r_x3": 227.81598999999997, "r_y3": 438.05542, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 233.70262, "t": 444.06183, "r": 263.51105, "b": 449.8904999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.70262, "r_y0": 449.8904999999999, "r_x1": 263.51105, "r_y1": 449.8904999999999, "r_x2": 263.51105, "r_y2": 444.06183, "r_x3": 233.70262, "r_y3": 444.06183, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 184.74655, "t": 293.39502, "r": 212.16055, "b": 298.75903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.74655, "r_y0": 298.75903, "r_x1": 212.16055, "r_y1": 298.75903, "r_x2": 212.16055, "r_y2": 293.39502, "r_x3": 184.74655, "r_y3": 293.39502, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 178.91229, "t": 299.14502, "r": 216.74378999999996, "b": 304.50903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91229, "r_y0": 304.50903, "r_x1": 216.74378999999996, "r_y1": 304.50903, "r_x2": 216.74378999999996, "r_y2": 299.14502, "r_x3": 178.91229, "r_y3": 299.14502, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 194.24574, "t": 282.7822, "r": 198.89099, "b": 287.84817999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.24574, "r_y0": 287.84817999999996, "r_x1": 198.89099, "r_y1": 287.84817999999996, "r_x2": 198.89099, "r_y2": 282.7822, "r_x3": 194.24574, "r_y3": 282.7822, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 221.45587, "t": 271.86914, "r": 276.47089, "b": 277.82916, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.45587, "r_y0": 277.82916, "r_x1": 276.47089, "r_y1": 277.82916, "r_x2": 276.47089, "r_y2": 271.86914, "r_x3": 221.45587, "r_y3": 271.86914, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 151.65219, "t": 323.44241, "r": 197.29019, "b": 329.10443, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65219, "r_y0": 329.10443, "r_x1": 197.29019, "r_y1": 329.10443, "r_x2": 197.29019, "r_y2": 323.44241, "r_x3": 151.65219, "r_y3": 323.44241, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 163.43277, "t": 329.44241, "r": 184.19028, "b": 335.10443, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43277, "r_y0": 335.10443, "r_x1": 184.19028, "r_y1": 335.10443, "r_x2": 184.19028, "r_y2": 329.44241, "r_x3": 163.43277, "r_y3": 329.44241, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 8, "label": "caption", "bbox": { "l": 50.112, "t": 527.7828099999999, "r": 286.36597, "b": 680.27094, "coord_origin": "TOPLEFT" }, "confidence": 0.8913407325744629, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 536.80893, "r_x1": 229.78752, "r_y1": 536.80893, "r_x2": 229.78752, "r_y2": 527.90237, "r_x3": 50.112, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.787, "r_y0": 536.7392, "r_x1": 267.76196, "r_y1": 536.7392, "r_x2": 267.76196, "r_y2": 527.7828099999999, "r_x3": 231.787, "r_y3": 527.7828099999999, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76401, "r_y0": 536.80893, "r_x1": 286.36169, "r_y1": 536.80893, "r_x2": 286.36169, "r_y2": 527.90237, "r_x3": 269.76401, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 548.76393, "r_x1": 286.36508, "r_y1": 548.76393, "r_x2": 286.36508, "r_y2": 539.85738, "r_x3": 50.112015, "r_y3": 539.85738, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 560.71992, "r_x1": 205.84735, "r_y1": 560.71992, "r_x2": 205.84735, "r_y2": 551.81337, "r_x3": 50.112015, "r_y3": 551.81337, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.01802, "r_y0": 560.6501900000001, "r_x1": 286.36392, "r_y1": 560.6501900000001, "r_x2": 286.36392, "r_y2": 551.69382, "r_x3": 208.01802, "r_y3": 551.69382, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 572.67493, "r_x1": 64.498009, "r_y1": 572.67493, "r_x2": 64.498009, "r_y2": 563.76837, "r_x3": 50.112015, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.165016, "r_y0": 572.60519, "r_x1": 151.31288, "r_y1": 572.60519, "r_x2": 151.31288, "r_y2": 563.64882, "r_x3": 68.165016, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31302, "r_y0": 572.67493, "r_x1": 153.80367, "r_y1": 572.67493, "r_x2": 153.80367, "r_y2": 563.76837, "r_x3": 151.31302, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.41884, "r_y0": 572.67493, "r_x1": 241.93283000000002, "r_y1": 572.67493, "r_x2": 241.93283000000002, "r_y2": 563.76837, "r_x3": 160.41884, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.59502, "r_y0": 572.60519, "r_x1": 286.362, "r_y1": 572.60519, "r_x2": 286.362, "r_y2": 563.64882, "r_x3": 245.59502, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 584.5602, "r_x1": 85.519089, "r_y1": 584.5602, "r_x2": 85.519089, "r_y2": 575.60382, "r_x3": 50.112015, "r_y3": 575.60382, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.623016, "r_y0": 584.6299300000001, "r_x1": 286.36072, "r_y1": 584.6299300000001, "r_x2": 286.36072, "r_y2": 575.7233699999999, "r_x3": 88.623016, "r_y3": 575.7233699999999, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 596.58493, "r_x1": 286.36511, "r_y1": 596.58493, "r_x2": 286.36511, "r_y2": 587.6783800000001, "r_x3": 50.112015, "r_y3": 587.6783800000001, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 608.53993, "r_x1": 286.36508, "r_y1": 608.53993, "r_x2": 286.36508, "r_y2": 599.63338, "r_x3": 50.112015, "r_y3": 599.63338, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 620.4949300000001, "r_x1": 240.43756000000002, "r_y1": 620.4949300000001, "r_x2": 240.43756000000002, "r_y2": 611.58838, "r_x3": 50.112015, "r_y3": 611.58838, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.19801, "r_y0": 620.4252, "r_x1": 286.36597, "r_y1": 620.4252, "r_x2": 286.36597, "r_y2": 611.46883, "r_x3": 243.19801, "r_y3": 611.46883, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 632.3812, "r_x1": 286.36511, "r_y1": 632.3812, "r_x2": 286.36511, "r_y2": 623.42482, "r_x3": 50.112015, "r_y3": 623.42482, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 644.3362, "r_x1": 286.36508, "r_y1": 644.3362, "r_x2": 286.36508, "r_y2": 635.37982, "r_x3": 50.112015, "r_y3": 635.37982, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 656.36093, "r_x1": 220.58205, "r_y1": 656.36093, "r_x2": 220.58205, "r_y2": 647.45438, "r_x3": 50.112015, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.57802000000004, "r_y0": 656.14175, "r_x1": 228.32693, "r_y1": 656.14175, "r_x2": 228.32693, "r_y2": 647.29497, "r_x3": 220.57802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.32700999999997, "r_y0": 656.36093, "r_x1": 236.07791000000003, "r_y1": 656.36093, "r_x2": 236.07791000000003, "r_y2": 647.45438, "r_x3": 228.32700999999997, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.07802000000004, "r_y0": 656.14175, "r_x1": 243.82693, "r_y1": 656.14175, "r_x2": 243.82693, "r_y2": 647.29497, "r_x3": 236.07802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.82602, "r_y0": 656.36093, "r_x1": 255.29298000000003, "r_y1": 656.36093, "r_x2": 255.29298000000003, "r_y2": 647.45438, "r_x3": 243.82602, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29102000000003, "r_y0": 656.14175, "r_x1": 263.03992, "r_y1": 656.14175, "r_x2": 263.03992, "r_y2": 647.29497, "r_x3": 255.29102000000003, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04001, "r_y0": 656.36093, "r_x1": 286.36246, "r_y1": 656.36093, "r_x2": 286.36246, "r_y2": 647.45438, "r_x3": 263.04001, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 668.31594, "r_x1": 286.36511, "r_y1": 668.31594, "r_x2": 286.36511, "r_y2": 659.40938, "r_x3": 50.112015, "r_y3": 659.40938, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 680.27094, "r_x1": 218.46996, "r_y1": 680.27094, "r_x2": 218.46996, "r_y2": 671.36438, "r_x3": 50.112015, "r_y3": 671.36438, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 308.862, "t": 249.53441999999995, "r": 545.11505, "b": 294.3069499999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9831458330154419, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.44097999999997, "r_x1": 523.05786, "r_y1": 258.44097999999997, "r_x2": 523.05786, "r_y2": 249.53441999999995, "r_x3": 308.862, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.19983, "r_y0": 258.44097999999997, "r_x1": 545.11505, "r_y1": 258.44097999999997, "r_x2": 545.11505, "r_y2": 249.53441999999995, "r_x3": 525.19983, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.39697, "r_x1": 517.55847, "r_y1": 270.39697, "r_x2": 517.55847, "r_y2": 261.49042, "r_x3": 308.862, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 270.39697, "r_x1": 545.11499, "r_y1": 270.39697, "r_x2": 545.11499, "r_y2": 261.49042, "r_x3": 520.76642, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.35196, "r_x1": 534.80377, "r_y1": 282.35196, "r_x2": 534.80377, "r_y2": 273.44537, "r_x3": 308.862, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36414, "r_y0": 282.35196, "r_x1": 545.11505, "r_y1": 282.35196, "r_x2": 545.11505, "r_y2": 273.44537, "r_x3": 537.36414, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.3069499999999, "r_x1": 341.24045, "r_y1": 294.3069499999999, "r_x2": 341.24045, "r_y2": 285.40039, "r_x3": 308.862, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73099, "r_y0": 294.07782000000003, "r_x1": 417.23508, "r_y1": 294.07782000000003, "r_x2": 417.23508, "r_y2": 285.49005, "r_x3": 343.73099, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23398, "r_y0": 294.3069499999999, "r_x1": 436.60129, "r_y1": 294.3069499999999, "r_x2": 436.60129, "r_y2": 285.40039, "r_x3": 417.23398, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09198, "r_y0": 294.07782000000003, "r_x1": 516.56116, "r_y1": 294.07782000000003, "r_x2": 516.56116, "r_y2": 285.49005, "r_x3": 439.09198, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56097, "r_y0": 294.3069499999999, "r_x1": 519.05164, "r_y1": 294.3069499999999, "r_x2": 519.05164, "r_y2": 285.40039, "r_x3": 516.56097, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.86194, "t": 297.33981, "r": 545.11511, "b": 413.96182, "coord_origin": "TOPLEFT" }, "confidence": 0.9862009882926941, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 306.2962, "r_x1": 400.86649, "r_y1": 306.2962, "r_x2": 400.86649, "r_y2": 297.33981, "r_x3": 320.81696, "r_y3": 297.33981, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91394, "r_y0": 306.36594, "r_x1": 528.33685, "r_y1": 306.36594, "r_x2": 528.33685, "r_y2": 297.45938, "r_x3": 403.91394, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.7179, "r_y0": 306.36594, "r_x1": 545.11383, "r_y1": 306.36594, "r_x2": 545.11383, "r_y2": 297.45938, "r_x3": 530.7179, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 318.32092, "r_x1": 517.5285, "r_y1": 318.32092, "r_x2": 517.5285, "r_y2": 309.41437, "r_x3": 308.86194, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09387, "r_y0": 318.32092, "r_x1": 545.11493, "r_y1": 318.32092, "r_x2": 545.11493, "r_y2": 309.41437, "r_x3": 524.09387, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 330.27591, "r_x1": 432.35833999999994, "r_y1": 330.27591, "r_x2": 432.35833999999994, "r_y2": 321.36934999999994, "r_x3": 308.86194, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.81995000000006, "r_y0": 330.04678, "r_x1": 510.29041, "r_y1": 330.04678, "r_x2": 510.29041, "r_y2": 321.45901, "r_x3": 435.81995000000006, "r_y3": 321.45901, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.97797, "r_y0": 330.27591, "r_x1": 520.62305, "r_y1": 330.27591, "r_x2": 520.62305, "r_y2": 321.36934999999994, "r_x3": 513.97797, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08008, "r_y0": 330.27591, "r_x1": 545.11115, "r_y1": 330.27591, "r_x2": 545.11115, "r_y2": 321.36934999999994, "r_x3": 524.08008, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 342.2309, "r_x1": 527.76013, "r_y1": 342.2309, "r_x2": 527.76013, "r_y2": 333.32434, "r_x3": 308.86197, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.729, "r_y0": 342.2309, "r_x1": 545.11499, "r_y1": 342.2309, "r_x2": 545.11499, "r_y2": 333.32434, "r_x3": 530.729, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 354.18588, "r_x1": 526.85352, "r_y1": 354.18588, "r_x2": 526.85352, "r_y2": 345.27933, "r_x3": 308.86197, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62311, "r_y0": 354.18588, "r_x1": 545.11493, "r_y1": 354.18588, "r_x2": 545.11493, "r_y2": 345.27933, "r_x3": 529.62311, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 366.14188, "r_x1": 524.51245, "r_y1": 366.14188, "r_x2": 524.51245, "r_y2": 357.23532, "r_x3": 308.86197, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.96948, "r_y0": 366.14188, "r_x1": 545.11511, "r_y1": 366.14188, "r_x2": 545.11511, "r_y2": 357.23532, "r_x3": 527.96948, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 378.09685999999994, "r_x1": 370.39096, "r_y1": 378.09685999999994, "r_x2": 370.39096, "r_y2": 369.19031000000007, "r_x3": 308.86197, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44449, "r_y0": 378.09685999999994, "r_x1": 526.91339, "r_y1": 378.09685999999994, "r_x2": 526.91339, "r_y2": 369.19031000000007, "r_x3": 377.44449, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72906, "r_y0": 378.09685999999994, "r_x1": 545.11505, "r_y1": 378.09685999999994, "r_x2": 545.11505, "r_y2": 369.19031000000007, "r_x3": 530.72906, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 390.05185, "r_x1": 505.46395999999993, "r_y1": 390.05185, "r_x2": 505.46395999999993, "r_y2": 381.14529000000005, "r_x3": 308.86197, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03430000000003, "r_y0": 390.05185, "r_x1": 545.11511, "r_y1": 390.05185, "r_x2": 545.11511, "r_y2": 381.14529000000005, "r_x3": 508.03430000000003, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 402.00684, "r_x1": 517.68799, "r_y1": 402.00684, "r_x2": 517.68799, "r_y2": 393.10028, "r_x3": 308.86197, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 402.00684, "r_x1": 545.11499, "r_y1": 402.00684, "r_x2": 545.11499, "r_y2": 393.10028, "r_x3": 520.76642, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 413.96182, "r_x1": 528.01935, "r_y1": 413.96182, "r_x2": 528.01935, "r_y2": 405.05526999999995, "r_x3": 308.86197, "r_y3": 405.05526999999995, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.86197, "t": 417.11426, "r": 545.11511, "b": 545.57271, "coord_origin": "TOPLEFT" }, "confidence": 0.9851906895637512, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 426.02081, "r_x1": 515.49609, "r_y1": 426.02081, "r_x2": 515.49609, "r_y2": 417.11426, "r_x3": 320.81696, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.7663, "r_y0": 426.02081, "r_x1": 545.11487, "r_y1": 426.02081, "r_x2": 545.11487, "r_y2": 417.11426, "r_x3": 520.7663, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 437.9758, "r_x1": 343.72107, "r_y1": 437.9758, "r_x2": 343.72107, "r_y2": 429.0692399999999, "r_x3": 308.86197, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.03796, "r_y0": 437.74667, "r_x1": 446.45471000000003, "r_y1": 437.74667, "r_x2": 446.45471000000003, "r_y2": 429.15891, "r_x3": 347.03796, "r_y3": 429.15891, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.93996999999996, "r_y0": 437.9758, "r_x1": 503.06055000000003, "r_y1": 437.9758, "r_x2": 503.06055000000003, "r_y2": 429.0692399999999, "r_x3": 449.93996999999996, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.37808, "r_y0": 437.9758, "r_x1": 537.3717, "r_y1": 437.9758, "r_x2": 537.3717, "r_y2": 429.0692399999999, "r_x3": 506.37808, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.68927, "r_y0": 437.9758, "r_x1": 545.11267, "r_y1": 437.9758, "r_x2": 545.11267, "r_y2": 429.0692399999999, "r_x3": 540.68927, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 449.93079, "r_x1": 522.78894, "r_y1": 449.93079, "r_x2": 522.78894, "r_y2": 441.02423, "r_x3": 308.86197, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.7478, "r_y0": 449.93079, "r_x1": 545.11511, "r_y1": 449.93079, "r_x2": 545.11511, "r_y2": 441.02423, "r_x3": 525.7478, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 461.88577, "r_x1": 384.14929, "r_y1": 461.88577, "r_x2": 384.14929, "r_y2": 452.97922, "r_x3": 308.86197, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37466, "r_y0": 461.88577, "r_x1": 527.84985, "r_y1": 461.88577, "r_x2": 527.84985, "r_y2": 452.97922, "r_x3": 393.37466, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39282, "r_y0": 461.88577, "r_x1": 545.11505, "r_y1": 461.88577, "r_x2": 545.11505, "r_y2": 452.97922, "r_x3": 532.39282, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 473.84177, "r_x1": 529.7627, "r_y1": 473.84177, "r_x2": 529.7627, "r_y2": 464.93521, "r_x3": 308.86197, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94073, "r_y0": 473.84177, "r_x1": 545.11505, "r_y1": 473.84177, "r_x2": 545.11505, "r_y2": 464.93521, "r_x3": 532.94073, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 485.79675, "r_x1": 514.17126, "r_y1": 485.79675, "r_x2": 514.17126, "r_y2": 476.8902, "r_x3": 308.86197, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89105, "r_y0": 485.79675, "r_x1": 545.11511, "r_y1": 485.79675, "r_x2": 545.11511, "r_y2": 476.8902, "r_x3": 516.89105, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.75174, "r_x1": 527.63068, "r_y1": 497.75174, "r_x2": 527.63068, "r_y2": 488.84518, "r_x3": 308.86197, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62317, "r_y0": 497.75174, "r_x1": 545.11499, "r_y1": 497.75174, "r_x2": 545.11499, "r_y2": 488.84518, "r_x3": 529.62317, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.70673, "r_x1": 508.3630999999999, "r_y1": 509.70673, "r_x2": 508.3630999999999, "r_y2": 500.80017, "r_x3": 308.86197, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09286000000003, "r_y0": 509.70673, "r_x1": 545.11511, "r_y1": 509.70673, "r_x2": 545.11511, "r_y2": 500.80017, "r_x3": 511.09286000000003, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.6617100000001, "r_x1": 545.11499, "r_y1": 521.6617100000001, "r_x2": 545.11499, "r_y2": 512.7551599999999, "r_x3": 308.86197, "r_y3": 512.7551599999999, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.61771, "r_x1": 545.11511, "r_y1": 533.61771, "r_x2": 545.11511, "r_y2": 524.71115, "r_x3": 308.86197, "r_y3": 524.71115, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.57271, "r_x1": 369.73349, "r_y1": 545.57271, "r_x2": 369.73349, "r_y2": 536.66615, "r_x3": 308.86197, "r_y3": 536.66615, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86194, "t": 548.6046, "r": 545.11511, "b": 653.27271, "coord_origin": "TOPLEFT" }, "confidence": 0.9869195818901062, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 557.56097, "r_x1": 404.76184, "r_y1": 557.56097, "r_x2": 404.76184, "r_y2": 548.6046, "r_x3": 320.81696, "r_y3": 548.6046, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34094, "r_y0": 557.63071, "r_x1": 545.11505, "r_y1": 557.63071, "r_x2": 545.11505, "r_y2": 548.72415, "r_x3": 410.34094, "r_y3": 548.72415, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 569.5867000000001, "r_x1": 545.11493, "r_y1": 569.5867000000001, "r_x2": 545.11493, "r_y2": 560.68015, "r_x3": 308.86194, "r_y3": 560.68015, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 581.5417, "r_x1": 545.11511, "r_y1": 581.5417, "r_x2": 545.11511, "r_y2": 572.6351500000001, "r_x3": 308.86194, "r_y3": 572.6351500000001, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 593.4967, "r_x1": 545.11493, "r_y1": 593.4967, "r_x2": 545.11493, "r_y2": 584.59015, "r_x3": 308.86194, "r_y3": 584.59015, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 605.45171, "r_x1": 545.11499, "r_y1": 605.45171, "r_x2": 545.11499, "r_y2": 596.54515, "r_x3": 308.86194, "r_y3": 596.54515, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 617.40671, "r_x1": 545.11505, "r_y1": 617.40671, "r_x2": 545.11505, "r_y2": 608.50015, "r_x3": 308.86194, "r_y3": 608.50015, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 629.36171, "r_x1": 545.11505, "r_y1": 629.36171, "r_x2": 545.11505, "r_y2": 620.45515, "r_x3": 308.86194, "r_y3": 620.45515, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 641.3177000000001, "r_x1": 381.67859, "r_y1": 641.3177000000001, "r_x2": 381.67859, "r_y2": 632.41115, "r_x3": 308.86194, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.99695, "r_y0": 641.09853, "r_x1": 391.74585, "r_y1": 641.09853, "r_x2": 391.74585, "r_y2": 632.25174, "r_x3": 383.99695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.74594, "r_y0": 641.3177000000001, "r_x1": 399.49686, "r_y1": 641.3177000000001, "r_x2": 399.49686, "r_y2": 632.41115, "r_x3": 391.74594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.49695, "r_y0": 641.09853, "r_x1": 407.24585, "r_y1": 641.09853, "r_x2": 407.24585, "r_y2": 632.25174, "r_x3": 399.49695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.24594, "r_y0": 641.3177000000001, "r_x1": 432.90958, "r_y1": 641.3177000000001, "r_x2": 432.90958, "r_y2": 632.41115, "r_x3": 407.24594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.90792999999996, "r_y0": 641.09853, "r_x1": 440.65683000000007, "r_y1": 641.09853, "r_x2": 440.65683000000007, "r_y2": 632.25174, "r_x3": 432.90792999999996, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.65691999999996, "r_y0": 641.3177000000001, "r_x1": 545.11475, "r_y1": 641.3177000000001, "r_x2": 545.11475, "r_y2": 632.41115, "r_x3": 440.65691999999996, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 653.27271, "r_x1": 398.96371, "r_y1": 653.27271, "r_x2": 398.96371, "r_y2": 644.3661500000001, "r_x3": 308.86194, "r_y3": 644.3661500000001, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.86194, "t": 656.42516, "r": 545.11505, "b": 713.151726, "coord_origin": "TOPLEFT" }, "confidence": 0.9852352142333984, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81693, "r_y0": 665.33172, "r_x1": 444.34316999999993, "r_y1": 665.33172, "r_x2": 444.34316999999993, "r_y2": 656.42516, "r_x3": 320.81693, "r_y3": 656.42516, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.00591999999995, "r_y0": 665.10258, "r_x1": 545.1076, "r_y1": 665.10258, "r_x2": 545.1076, "r_y2": 656.51482, "r_x3": 447.00591999999995, "r_y3": 656.51482, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 677.2867200000001, "r_x1": 545.11505, "r_y1": 677.2867200000001, "r_x2": 545.11505, "r_y2": 668.38016, "r_x3": 308.86194, "r_y3": 668.38016, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 689.24172, "r_x1": 545.11505, "r_y1": 689.24172, "r_x2": 545.11505, "r_y2": 680.33516, "r_x3": 308.86194, "r_y3": 680.33516, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 701.196724, "r_x1": 545.11505, "r_y1": 701.196724, "r_x2": 545.11505, "r_y2": 692.290161, "r_x3": 308.86194, "r_y3": 692.290161, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 713.151726, "r_x1": 545.11505, "r_y1": 713.151726, "r_x2": 545.11505, "r_y2": 704.245163, "r_x3": 308.86194, "r_y3": 704.245163, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_footer", "bbox": { "l": 295.12094, "t": 734.13316, "r": 300.10223, "b": 743.039722, "coord_origin": "TOPLEFT" }, "confidence": 0.8719564080238342, "cells": [ { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12094, "r_y0": 743.039722, "r_x1": 300.10223, "r_y1": 743.039722, "r_x2": 300.10223, "r_y2": 734.13316, "r_x3": 295.12094, "r_y3": 734.13316, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "picture", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT" }, "confidence": 0.9296807646751404, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 125.62891000000002, "r_x1": 84.927567, "r_y1": 125.62891000000002, "r_x2": 84.927567, "r_y2": 122.43970000000002, "r_x3": 81.688072, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 125.62891000000002, "r_x1": 93.026291, "r_y1": 125.62891000000002, "r_x2": 93.026291, "r_y2": 122.43970000000002, "r_x3": 86.54731, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.50498, "r_y0": 118.44135000000006, "r_x1": 115.3461, "r_y1": 118.44135000000006, "r_x2": 115.3461, "r_y2": 115.25214000000005, "r_x3": 102.50498, "r_y3": 115.25214000000005, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.140205, "r_y0": 118.40410999999995, "r_x1": 93.291527, "r_y1": 118.40410999999995, "r_x2": 93.291527, "r_y2": 115.21489999999994, "r_x3": 82.140205, "r_y3": 115.21489999999994, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 125.62891000000002, "r_x1": 104.3119, "r_y1": 125.62891000000002, "r_x2": 104.3119, "r_y2": 122.43970000000002, "r_x3": 96.748268, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 130.93291999999997, "r_x1": 102.42083, "r_y1": 130.93291999999997, "r_x2": 102.42083, "r_y2": 127.74370999999985, "r_x3": 96.748268, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 136.6449, "r_x1": 104.3119, "r_y1": 136.6449, "r_x2": 104.3119, "r_y2": 133.45569, "r_x3": 96.748268, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 142.35693000000003, "r_x1": 102.42083, "r_y1": 142.35693000000003, "r_x2": 102.42083, "r_y2": 139.16772000000003, "r_x3": 96.748268, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 125.62891000000002, "r_x1": 116.14391, "r_y1": 125.62891000000002, "r_x2": 116.14391, "r_y2": 122.43970000000002, "r_x3": 110.66107, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 130.93291999999997, "r_x1": 116.14391, "r_y1": 130.93291999999997, "r_x2": 116.14391, "r_y2": 127.74370999999985, "r_x3": 110.66107, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 136.6449, "r_x1": 116.14391, "r_y1": 136.6449, "r_x2": 116.14391, "r_y2": 133.45569, "r_x3": 110.66107, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 142.35693000000003, "r_x1": 116.14391, "r_y1": 142.35693000000003, "r_x2": 116.14391, "r_y2": 139.16772000000003, "r_x3": 110.66107, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 130.93291999999997, "r_x1": 84.927567, "r_y1": 130.93291999999997, "r_x2": 84.927567, "r_y2": 127.74370999999985, "r_x3": 81.688072, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 130.93291999999997, "r_x1": 93.026291, "r_y1": 130.93291999999997, "r_x2": 93.026291, "r_y2": 127.74370999999985, "r_x3": 86.54731, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 136.6449, "r_x1": 84.927567, "r_y1": 136.6449, "r_x2": 84.927567, "r_y2": 133.45569, "r_x3": 81.688072, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 136.6449, "r_x1": 93.026291, "r_y1": 136.6449, "r_x2": 93.026291, "r_y2": 133.45569, "r_x3": 86.54731, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 142.35693000000003, "r_x1": 84.927567, "r_y1": 142.35693000000003, "r_x2": 84.927567, "r_y2": 139.16772000000003, "r_x3": 81.688072, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 142.35693000000003, "r_x1": 93.026291, "r_y1": 142.35693000000003, "r_x2": 93.026291, "r_y2": 139.16772000000003, "r_x3": 86.54731, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.084389, "r_y0": 96.23798, "r_x1": 113.93649, "r_y1": 96.23798, "r_x2": 113.93649, "r_y2": 90.49738000000002, "r_x3": 88.084389, "r_y3": 90.49738000000002, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81002, "r_y0": 103.37798999999995, "r_x1": 119.21240000000002, "r_y1": 103.37798999999995, "r_x2": 119.21240000000002, "r_y2": 97.63738999999998, "r_x3": 82.81002, "r_y3": 97.63738999999998, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94247, "r_y0": 106.34295999999995, "r_x1": 180.01131, "r_y1": 106.34295999999995, "r_x2": 180.01131, "r_y2": 100.60235999999998, "r_x3": 143.94247, "r_y3": 100.60235999999998, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94064, "r_y0": 113.48297000000014, "r_x1": 172.0118, "r_y1": 113.48297000000014, "r_x2": 172.0118, "r_y2": 107.74237000000005, "r_x3": 151.94064, "r_y3": 107.74237000000005, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.76939000000002, "r_y0": 86.67156999999997, "r_x1": 266.39557, "r_y1": 86.67156999999997, "r_x2": 266.39557, "r_y2": 80.93096999999989, "r_x3": 251.76939000000002, "r_y3": 80.93096999999989, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 91.77161000000001, "r_x1": 270.65021, "r_y1": 91.77161000000001, "r_x2": 270.65021, "r_y2": 86.03101000000004, "r_x3": 247.51601, "r_y3": 86.03101000000004, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.03699, "r_y0": 84.30042000000003, "r_x1": 352.12589, "r_y1": 84.30042000000003, "r_x2": 352.12589, "r_y2": 78.55980999999997, "r_x3": 331.03699, "r_y3": 78.55980999999997, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56421, "r_y0": 101.77282999999989, "r_x1": 431.7261, "r_y1": 101.77282999999989, "r_x2": 431.7261, "r_y2": 96.03223000000003, "r_x3": 390.56421, "r_y3": 96.03223000000003, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82422, "r_y0": 107.89287999999999, "r_x1": 435.46966999999995, "r_y1": 107.89287999999999, "r_x2": 435.46966999999995, "r_y2": 102.15228000000013, "r_x3": 386.82422, "r_y3": 102.15228000000013, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.69589, "r_y0": 114.01288000000011, "r_x1": 433.6032400000001, "r_y1": 114.01288000000011, "r_x2": 433.6032400000001, "r_y2": 108.27228000000002, "r_x3": 388.69589, "r_y3": 108.27228000000002, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.07761, "r_y0": 120.13286999999991, "r_x1": 431.22542999999996, "r_y1": 120.13286999999991, "r_x2": 431.22542999999996, "r_y2": 114.39227000000005, "r_x3": 391.07761, "r_y3": 114.39227000000005, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.22650000000004, "r_y0": 157.42571999999996, "r_x1": 498.82068, "r_y1": 157.42571999999996, "r_x2": 498.82068, "r_y2": 151.68511999999998, "r_x3": 431.22650000000004, "r_y3": 151.68511999999998, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.1738, "r_y0": 163.54578000000004, "r_x1": 498.87753000000004, "r_y1": 163.54578000000004, "r_x2": 498.87753000000004, "r_y2": 157.80517999999995, "r_x3": 431.1738, "r_y3": 157.80517999999995, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.5289, "r_y0": 169.66576999999995, "r_x1": 489.51827999999995, "r_y1": 169.66576999999995, "r_x2": 489.51827999999995, "r_y2": 163.92516999999998, "r_x3": 440.5289, "r_y3": 163.92516999999998, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37479, "r_y0": 183.99445000000003, "r_x1": 367.72333, "r_y1": 183.99445000000003, "r_x2": 367.72333, "r_y2": 178.25385000000006, "r_x3": 328.37479, "r_y3": 178.25385000000006, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 129.64948000000015, "r_x1": 373.67963, "r_y1": 129.64948000000015, "r_x2": 373.67963, "r_y2": 123.90886999999998, "r_x3": 331.84451, "r_y3": 123.90886999999998, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 134.74945000000002, "r_x1": 381.17786, "r_y1": 134.74945000000002, "r_x2": 381.17786, "r_y2": 129.00885000000017, "r_x3": 331.84451, "r_y3": 129.00885000000017, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.62633, "r_y0": 93.85681, "r_x1": 219.42332, "r_y1": 93.85681, "r_x2": 219.42332, "r_y2": 88.11621000000002, "r_x3": 196.62633, "r_y3": 88.11621000000002, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.66771, "r_y0": 135.23528999999996, "r_x1": 271.49899, "r_y1": 135.23528999999996, "r_x2": 271.49899, "r_y2": 129.4946900000001, "r_x3": 246.66771, "r_y3": 129.4946900000001, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 140.33533, "r_x1": 270.65021, "r_y1": 140.33533, "r_x2": 270.65021, "r_y2": 134.59473000000003, "r_x3": 247.51601, "r_y3": 134.59473000000003, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 94.75982999999997, "r_x1": 365.55347, "r_y1": 94.75982999999997, "r_x2": 365.55347, "r_y2": 89.01923, "r_x3": 330.63071, "r_y3": 89.01923, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 102.91985999999997, "r_x1": 370.22717, "r_y1": 102.91985999999997, "r_x2": 370.22717, "r_y2": 97.17926, "r_x3": 330.63071, "r_y3": 97.17926, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 111.07983000000002, "r_x1": 374.51157, "r_y1": 111.07983000000002, "r_x2": 374.51157, "r_y2": 105.33922999999993, "r_x3": 330.63071, "r_y3": 105.33922999999993, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 119.23987, "r_x1": 335.73233, "r_y1": 119.23987, "r_x2": 335.73233, "r_y2": 113.49926999999991, "r_x3": 330.63071, "r_y3": 113.49926999999991, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 146.57617000000005, "r_x1": 335.05988, "r_y1": 146.57617000000005, "r_x2": 335.05988, "r_y2": 141.79236000000003, "r_x3": 322.30579, "r_y3": 141.79236000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 153.71613000000002, "r_x1": 335.05988, "r_y1": 153.71613000000002, "r_x2": 335.05988, "r_y2": 148.93231000000003, "r_x3": 322.30579, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.54971, "r_y0": 154.29638999999997, "r_x1": 340.95242, "r_y1": 154.29638999999997, "r_x2": 340.95242, "r_y2": 148.55579, "r_x3": 337.54971, "r_y3": 148.55579, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56262, "r_y0": 153.71613000000002, "r_x1": 398.91446, "r_y1": 153.71613000000002, "r_x2": 398.91446, "r_y2": 148.93231000000003, "r_x3": 343.56262, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.41718, "r_y0": 153.71613000000002, "r_x1": 421.58801, "r_y1": 153.71613000000002, "r_x2": 421.58801, "r_y2": 148.93231000000003, "r_x3": 407.41718, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 160.85613999999998, "r_x1": 349.23022, "r_y1": 160.85613999999998, "r_x2": 349.23022, "r_y2": 156.07232999999997, "r_x3": 322.30579, "r_y3": 156.07232999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 167.99614999999994, "r_x1": 335.05988, "r_y1": 167.99614999999994, "r_x2": 335.05988, "r_y2": 163.21234000000004, "r_x3": 322.30579, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56155, "r_y0": 167.99614999999994, "r_x1": 374.73685, "r_y1": 167.99614999999994, "r_x2": 374.73685, "r_y2": 163.21234000000004, "r_x3": 343.56155, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 175.13617, "r_x1": 326.55716, "r_y1": 175.13617, "r_x2": 326.55716, "r_y2": 170.35235999999998, "r_x3": 322.30579, "r_y3": 170.35235999999998, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51111, "r_y0": 95.41027999999994, "r_x1": 326.91382, "r_y1": 95.41027999999994, "r_x2": 326.91382, "r_y2": 89.66967999999997, "r_x3": 323.51111, "r_y3": 89.66967999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 103.52948000000004, "r_x1": 327.1178, "r_y1": 103.52948000000004, "r_x2": 327.1178, "r_y2": 97.78887999999995, "r_x3": 323.71509, "r_y3": 97.78887999999995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 111.73029000000008, "r_x1": 327.1178, "r_y1": 111.73029000000008, "r_x2": 327.1178, "r_y2": 105.98969, "r_x3": 323.71509, "r_y3": 105.98969, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.4816, "r_y0": 154.28687000000002, "r_x1": 404.88431, "r_y1": 154.28687000000002, "r_x2": 404.88431, "r_y2": 148.54625999999996, "r_x3": 401.4816, "r_y3": 148.54625999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.6976, "r_y0": 168.42511000000002, "r_x1": 341.10031, "r_y1": 168.42511000000002, "r_x2": 341.10031, "r_y2": 162.68451000000005, "r_x3": 337.6976, "r_y3": 162.68451000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46378, "r_y0": 110.28644000000008, "r_x1": 457.86648999999994, "r_y1": 110.28644000000008, "r_x2": 457.86648999999994, "r_y2": 104.54584, "r_x3": 454.46378, "r_y3": 104.54584, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.32580999999993, "r_y0": 96.83605999999997, "r_x1": 496.72852, "r_y1": 96.83605999999997, "r_x2": 496.72852, "r_y2": 91.09546, "r_x3": 493.32580999999993, "r_y3": 91.09546, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08298, "r_y0": 96.30939000000001, "r_x1": 457.48569000000003, "r_y1": 96.30939000000001, "r_x2": 457.48569000000003, "r_y2": 90.56879000000015, "r_x3": 454.08298, "r_y3": 90.56879000000015, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 81.688072, "t": 122.43970000000002, "r": 84.927567, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 125.62891000000002, "r_x1": 84.927567, "r_y1": 125.62891000000002, "r_x2": 84.927567, "r_y2": 122.43970000000002, "r_x3": 81.688072, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 86.54731, "t": 122.43970000000002, "r": 93.026291, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 125.62891000000002, "r_x1": 93.026291, "r_y1": 125.62891000000002, "r_x2": 93.026291, "r_y2": 122.43970000000002, "r_x3": 86.54731, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 102.50498, "t": 115.25214000000005, "r": 115.3461, "b": 118.44135000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.50498, "r_y0": 118.44135000000006, "r_x1": 115.3461, "r_y1": 118.44135000000006, "r_x2": 115.3461, "r_y2": 115.25214000000005, "r_x3": 102.50498, "r_y3": 115.25214000000005, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 82.140205, "t": 115.21489999999994, "r": 93.291527, "b": 118.40410999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.140205, "r_y0": 118.40410999999995, "r_x1": 93.291527, "r_y1": 118.40410999999995, "r_x2": 93.291527, "r_y2": 115.21489999999994, "r_x3": 82.140205, "r_y3": 115.21489999999994, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 96.748268, "t": 122.43970000000002, "r": 104.3119, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 125.62891000000002, "r_x1": 104.3119, "r_y1": 125.62891000000002, "r_x2": 104.3119, "r_y2": 122.43970000000002, "r_x3": 96.748268, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 96.748268, "t": 127.74370999999985, "r": 102.42083, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 130.93291999999997, "r_x1": 102.42083, "r_y1": 130.93291999999997, "r_x2": 102.42083, "r_y2": 127.74370999999985, "r_x3": 96.748268, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 96.748268, "t": 133.45569, "r": 104.3119, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 136.6449, "r_x1": 104.3119, "r_y1": 136.6449, "r_x2": 104.3119, "r_y2": 133.45569, "r_x3": 96.748268, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 96.748268, "t": 139.16772000000003, "r": 102.42083, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 142.35693000000003, "r_x1": 102.42083, "r_y1": 142.35693000000003, "r_x2": 102.42083, "r_y2": 139.16772000000003, "r_x3": 96.748268, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 110.66107, "t": 122.43970000000002, "r": 116.14391, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 125.62891000000002, "r_x1": 116.14391, "r_y1": 125.62891000000002, "r_x2": 116.14391, "r_y2": 122.43970000000002, "r_x3": 110.66107, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 110.66107, "t": 127.74370999999985, "r": 116.14391, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 130.93291999999997, "r_x1": 116.14391, "r_y1": 130.93291999999997, "r_x2": 116.14391, "r_y2": 127.74370999999985, "r_x3": 110.66107, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 110.66107, "t": 133.45569, "r": 116.14391, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 136.6449, "r_x1": 116.14391, "r_y1": 136.6449, "r_x2": 116.14391, "r_y2": 133.45569, "r_x3": 110.66107, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 110.66107, "t": 139.16772000000003, "r": 116.14391, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 142.35693000000003, "r_x1": 116.14391, "r_y1": 142.35693000000003, "r_x2": 116.14391, "r_y2": 139.16772000000003, "r_x3": 110.66107, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 81.688072, "t": 127.74370999999985, "r": 84.927567, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 130.93291999999997, "r_x1": 84.927567, "r_y1": 130.93291999999997, "r_x2": 84.927567, "r_y2": 127.74370999999985, "r_x3": 81.688072, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 86.54731, "t": 127.74370999999985, "r": 93.026291, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 130.93291999999997, "r_x1": 93.026291, "r_y1": 130.93291999999997, "r_x2": 93.026291, "r_y2": 127.74370999999985, "r_x3": 86.54731, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 81.688072, "t": 133.45569, "r": 84.927567, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 136.6449, "r_x1": 84.927567, "r_y1": 136.6449, "r_x2": 84.927567, "r_y2": 133.45569, "r_x3": 81.688072, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 86.54731, "t": 133.45569, "r": 93.026291, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 136.6449, "r_x1": 93.026291, "r_y1": 136.6449, "r_x2": 93.026291, "r_y2": 133.45569, "r_x3": 86.54731, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 81.688072, "t": 139.16772000000003, "r": 84.927567, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 142.35693000000003, "r_x1": 84.927567, "r_y1": 142.35693000000003, "r_x2": 84.927567, "r_y2": 139.16772000000003, "r_x3": 81.688072, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 86.54731, "t": 139.16772000000003, "r": 93.026291, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 142.35693000000003, "r_x1": 93.026291, "r_y1": 142.35693000000003, "r_x2": 93.026291, "r_y2": 139.16772000000003, "r_x3": 86.54731, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 88.084389, "t": 90.49738000000002, "r": 113.93649, "b": 96.23798, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.084389, "r_y0": 96.23798, "r_x1": 113.93649, "r_y1": 96.23798, "r_x2": 113.93649, "r_y2": 90.49738000000002, "r_x3": 88.084389, "r_y3": 90.49738000000002, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 82.81002, "t": 97.63738999999998, "r": 119.21240000000002, "b": 103.37798999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81002, "r_y0": 103.37798999999995, "r_x1": 119.21240000000002, "r_y1": 103.37798999999995, "r_x2": 119.21240000000002, "r_y2": 97.63738999999998, "r_x3": 82.81002, "r_y3": 97.63738999999998, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 143.94247, "t": 100.60235999999998, "r": 180.01131, "b": 106.34295999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94247, "r_y0": 106.34295999999995, "r_x1": 180.01131, "r_y1": 106.34295999999995, "r_x2": 180.01131, "r_y2": 100.60235999999998, "r_x3": 143.94247, "r_y3": 100.60235999999998, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 151.94064, "t": 107.74237000000005, "r": 172.0118, "b": 113.48297000000014, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94064, "r_y0": 113.48297000000014, "r_x1": 172.0118, "r_y1": 113.48297000000014, "r_x2": 172.0118, "r_y2": 107.74237000000005, "r_x3": 151.94064, "r_y3": 107.74237000000005, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 251.76939000000002, "t": 80.93096999999989, "r": 266.39557, "b": 86.67156999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.76939000000002, "r_y0": 86.67156999999997, "r_x1": 266.39557, "r_y1": 86.67156999999997, "r_x2": 266.39557, "r_y2": 80.93096999999989, "r_x3": 251.76939000000002, "r_y3": 80.93096999999989, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 247.51601, "t": 86.03101000000004, "r": 270.65021, "b": 91.77161000000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 91.77161000000001, "r_x1": 270.65021, "r_y1": 91.77161000000001, "r_x2": 270.65021, "r_y2": 86.03101000000004, "r_x3": 247.51601, "r_y3": 86.03101000000004, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 331.03699, "t": 78.55980999999997, "r": 352.12589, "b": 84.30042000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.03699, "r_y0": 84.30042000000003, "r_x1": 352.12589, "r_y1": 84.30042000000003, "r_x2": 352.12589, "r_y2": 78.55980999999997, "r_x3": 331.03699, "r_y3": 78.55980999999997, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 390.56421, "t": 96.03223000000003, "r": 431.7261, "b": 101.77282999999989, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56421, "r_y0": 101.77282999999989, "r_x1": 431.7261, "r_y1": 101.77282999999989, "r_x2": 431.7261, "r_y2": 96.03223000000003, "r_x3": 390.56421, "r_y3": 96.03223000000003, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 386.82422, "t": 102.15228000000013, "r": 435.46966999999995, "b": 107.89287999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82422, "r_y0": 107.89287999999999, "r_x1": 435.46966999999995, "r_y1": 107.89287999999999, "r_x2": 435.46966999999995, "r_y2": 102.15228000000013, "r_x3": 386.82422, "r_y3": 102.15228000000013, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 388.69589, "t": 108.27228000000002, "r": 433.6032400000001, "b": 114.01288000000011, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.69589, "r_y0": 114.01288000000011, "r_x1": 433.6032400000001, "r_y1": 114.01288000000011, "r_x2": 433.6032400000001, "r_y2": 108.27228000000002, "r_x3": 388.69589, "r_y3": 108.27228000000002, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 391.07761, "t": 114.39227000000005, "r": 431.22542999999996, "b": 120.13286999999991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.07761, "r_y0": 120.13286999999991, "r_x1": 431.22542999999996, "r_y1": 120.13286999999991, "r_x2": 431.22542999999996, "r_y2": 114.39227000000005, "r_x3": 391.07761, "r_y3": 114.39227000000005, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 431.22650000000004, "t": 151.68511999999998, "r": 498.82068, "b": 157.42571999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.22650000000004, "r_y0": 157.42571999999996, "r_x1": 498.82068, "r_y1": 157.42571999999996, "r_x2": 498.82068, "r_y2": 151.68511999999998, "r_x3": 431.22650000000004, "r_y3": 151.68511999999998, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 431.1738, "t": 157.80517999999995, "r": 498.87753000000004, "b": 163.54578000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.1738, "r_y0": 163.54578000000004, "r_x1": 498.87753000000004, "r_y1": 163.54578000000004, "r_x2": 498.87753000000004, "r_y2": 157.80517999999995, "r_x3": 431.1738, "r_y3": 157.80517999999995, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 440.5289, "t": 163.92516999999998, "r": 489.51827999999995, "b": 169.66576999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.5289, "r_y0": 169.66576999999995, "r_x1": 489.51827999999995, "r_y1": 169.66576999999995, "r_x2": 489.51827999999995, "r_y2": 163.92516999999998, "r_x3": 440.5289, "r_y3": 163.92516999999998, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 328.37479, "t": 178.25385000000006, "r": 367.72333, "b": 183.99445000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37479, "r_y0": 183.99445000000003, "r_x1": 367.72333, "r_y1": 183.99445000000003, "r_x2": 367.72333, "r_y2": 178.25385000000006, "r_x3": 328.37479, "r_y3": 178.25385000000006, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 331.84451, "t": 123.90886999999998, "r": 373.67963, "b": 129.64948000000015, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 129.64948000000015, "r_x1": 373.67963, "r_y1": 129.64948000000015, "r_x2": 373.67963, "r_y2": 123.90886999999998, "r_x3": 331.84451, "r_y3": 123.90886999999998, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 331.84451, "t": 129.00885000000017, "r": 381.17786, "b": 134.74945000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 134.74945000000002, "r_x1": 381.17786, "r_y1": 134.74945000000002, "r_x2": 381.17786, "r_y2": 129.00885000000017, "r_x3": 331.84451, "r_y3": 129.00885000000017, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 196.62633, "t": 88.11621000000002, "r": 219.42332, "b": 93.85681, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.62633, "r_y0": 93.85681, "r_x1": 219.42332, "r_y1": 93.85681, "r_x2": 219.42332, "r_y2": 88.11621000000002, "r_x3": 196.62633, "r_y3": 88.11621000000002, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 246.66771, "t": 129.4946900000001, "r": 271.49899, "b": 135.23528999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.66771, "r_y0": 135.23528999999996, "r_x1": 271.49899, "r_y1": 135.23528999999996, "r_x2": 271.49899, "r_y2": 129.4946900000001, "r_x3": 246.66771, "r_y3": 129.4946900000001, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 247.51601, "t": 134.59473000000003, "r": 270.65021, "b": 140.33533, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 140.33533, "r_x1": 270.65021, "r_y1": 140.33533, "r_x2": 270.65021, "r_y2": 134.59473000000003, "r_x3": 247.51601, "r_y3": 134.59473000000003, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 330.63071, "t": 89.01923, "r": 365.55347, "b": 94.75982999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 94.75982999999997, "r_x1": 365.55347, "r_y1": 94.75982999999997, "r_x2": 365.55347, "r_y2": 89.01923, "r_x3": 330.63071, "r_y3": 89.01923, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 330.63071, "t": 97.17926, "r": 370.22717, "b": 102.91985999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 102.91985999999997, "r_x1": 370.22717, "r_y1": 102.91985999999997, "r_x2": 370.22717, "r_y2": 97.17926, "r_x3": 330.63071, "r_y3": 97.17926, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 330.63071, "t": 105.33922999999993, "r": 374.51157, "b": 111.07983000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 111.07983000000002, "r_x1": 374.51157, "r_y1": 111.07983000000002, "r_x2": 374.51157, "r_y2": 105.33922999999993, "r_x3": 330.63071, "r_y3": 105.33922999999993, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 330.63071, "t": 113.49926999999991, "r": 335.73233, "b": 119.23987, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 119.23987, "r_x1": 335.73233, "r_y1": 119.23987, "r_x2": 335.73233, "r_y2": 113.49926999999991, "r_x3": 330.63071, "r_y3": 113.49926999999991, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 322.30579, "t": 141.79236000000003, "r": 335.05988, "b": 146.57617000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 146.57617000000005, "r_x1": 335.05988, "r_y1": 146.57617000000005, "r_x2": 335.05988, "r_y2": 141.79236000000003, "r_x3": 322.30579, "r_y3": 141.79236000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 322.30579, "t": 148.93231000000003, "r": 335.05988, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 153.71613000000002, "r_x1": 335.05988, "r_y1": 153.71613000000002, "r_x2": 335.05988, "r_y2": 148.93231000000003, "r_x3": 322.30579, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 337.54971, "t": 148.55579, "r": 340.95242, "b": 154.29638999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.54971, "r_y0": 154.29638999999997, "r_x1": 340.95242, "r_y1": 154.29638999999997, "r_x2": 340.95242, "r_y2": 148.55579, "r_x3": 337.54971, "r_y3": 148.55579, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 343.56262, "t": 148.93231000000003, "r": 398.91446, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56262, "r_y0": 153.71613000000002, "r_x1": 398.91446, "r_y1": 153.71613000000002, "r_x2": 398.91446, "r_y2": 148.93231000000003, "r_x3": 343.56262, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 407.41718, "t": 148.93231000000003, "r": 421.58801, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.41718, "r_y0": 153.71613000000002, "r_x1": 421.58801, "r_y1": 153.71613000000002, "r_x2": 421.58801, "r_y2": 148.93231000000003, "r_x3": 407.41718, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 322.30579, "t": 156.07232999999997, "r": 349.23022, "b": 160.85613999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 160.85613999999998, "r_x1": 349.23022, "r_y1": 160.85613999999998, "r_x2": 349.23022, "r_y2": 156.07232999999997, "r_x3": 322.30579, "r_y3": 156.07232999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 322.30579, "t": 163.21234000000004, "r": 335.05988, "b": 167.99614999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 167.99614999999994, "r_x1": 335.05988, "r_y1": 167.99614999999994, "r_x2": 335.05988, "r_y2": 163.21234000000004, "r_x3": 322.30579, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 343.56155, "t": 163.21234000000004, "r": 374.73685, "b": 167.99614999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56155, "r_y0": 167.99614999999994, "r_x1": 374.73685, "r_y1": 167.99614999999994, "r_x2": 374.73685, "r_y2": 163.21234000000004, "r_x3": 343.56155, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 322.30579, "t": 170.35235999999998, "r": 326.55716, "b": 175.13617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 175.13617, "r_x1": 326.55716, "r_y1": 175.13617, "r_x2": 326.55716, "r_y2": 170.35235999999998, "r_x3": 322.30579, "r_y3": 170.35235999999998, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 323.51111, "t": 89.66967999999997, "r": 326.91382, "b": 95.41027999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51111, "r_y0": 95.41027999999994, "r_x1": 326.91382, "r_y1": 95.41027999999994, "r_x2": 326.91382, "r_y2": 89.66967999999997, "r_x3": 323.51111, "r_y3": 89.66967999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 323.71509, "t": 97.78887999999995, "r": 327.1178, "b": 103.52948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 103.52948000000004, "r_x1": 327.1178, "r_y1": 103.52948000000004, "r_x2": 327.1178, "r_y2": 97.78887999999995, "r_x3": 323.71509, "r_y3": 97.78887999999995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 323.71509, "t": 105.98969, "r": 327.1178, "b": 111.73029000000008, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 111.73029000000008, "r_x1": 327.1178, "r_y1": 111.73029000000008, "r_x2": 327.1178, "r_y2": 105.98969, "r_x3": 323.71509, "r_y3": 105.98969, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 401.4816, "t": 148.54625999999996, "r": 404.88431, "b": 154.28687000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.4816, "r_y0": 154.28687000000002, "r_x1": 404.88431, "r_y1": 154.28687000000002, "r_x2": 404.88431, "r_y2": 148.54625999999996, "r_x3": 401.4816, "r_y3": 148.54625999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 337.6976, "t": 162.68451000000005, "r": 341.10031, "b": 168.42511000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.6976, "r_y0": 168.42511000000002, "r_x1": 341.10031, "r_y1": 168.42511000000002, "r_x2": 341.10031, "r_y2": 162.68451000000005, "r_x3": 337.6976, "r_y3": 162.68451000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 454.46378, "t": 104.54584, "r": 457.86648999999994, "b": 110.28644000000008, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46378, "r_y0": 110.28644000000008, "r_x1": 457.86648999999994, "r_y1": 110.28644000000008, "r_x2": 457.86648999999994, "r_y2": 104.54584, "r_x3": 454.46378, "r_y3": 104.54584, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 493.32580999999993, "t": 91.09546, "r": 496.72852, "b": 96.83605999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.32580999999993, "r_y0": 96.83605999999997, "r_x1": 496.72852, "r_y1": 96.83605999999997, "r_x2": 496.72852, "r_y2": 91.09546, "r_x3": 493.32580999999993, "r_y3": 91.09546, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 454.08298, "t": 90.56879000000015, "r": 457.48569000000003, "b": 96.30939000000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08298, "r_y0": 96.30939000000001, "r_x1": 457.48569000000003, "r_y1": 96.30939000000001, "r_x2": 457.48569000000003, "r_y2": 90.56879000000015, "r_x3": 454.08298, "r_y3": 90.56879000000015, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.111992, "t": 203.98577999999998, "r": 545.10846, "b": 224.96691999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9677652716636658, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 213.01189999999997, "r_x1": 86.883949, "r_y1": 213.01189999999997, "r_x2": 86.883949, "r_y2": 204.10535000000004, "r_x3": 50.112, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.020996, "r_y0": 212.94214, "r_x1": 149.85141, "r_y1": 212.94214, "r_x2": 149.85141, "r_y2": 203.98577999999998, "r_x3": 94.020996, "r_y3": 203.98577999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86099, "r_y0": 213.01189999999997, "r_x1": 545.10846, "r_y1": 213.01189999999997, "r_x2": 545.10846, "r_y2": 204.10535000000004, "r_x3": 152.86099, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 224.96691999999996, "r_x1": 436.0134, "r_y1": 224.96691999999996, "r_x2": 436.0134, "r_y2": 216.06035999999995, "r_x3": 50.111992, "r_y3": 216.06035999999995, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure." }, { "label": "picture", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT" }, "confidence": 0.9724942445755005, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.253464, "r_y0": 264.17474000000004, "r_x1": 101.75846, "r_y1": 264.17474000000004, "r_x2": 101.75846, "r_y2": 258.21472000000006, "r_x3": 74.253464, "r_y3": 258.21472000000006, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.29972, "r_y0": 264.30524, "r_x1": 157.83972, "r_y1": 264.30524, "r_x2": 157.83972, "r_y2": 258.34520999999995, "r_x3": 122.29972, "r_y3": 258.34520999999995, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.549347, "r_y0": 377.04782, "r_x1": 125.68359000000001, "r_y1": 377.04782, "r_x2": 125.68359000000001, "r_y2": 371.38579999999996, "r_x3": 78.549347, "r_y3": 371.38579999999996, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.513298, "r_y0": 396.98059, "r_x1": 84.644547, "r_y1": 396.98059, "r_x2": 84.644547, "r_y2": 391.31857, "r_x3": 78.513298, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.52705, "r_y0": 396.98059, "r_x1": 125.11079999999998, "r_y1": 396.98059, "r_x2": 125.11079999999998, "r_y2": 391.31857, "r_x3": 116.52705, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.024773, "r_y0": 430.11511, "r_x1": 127.92327000000002, "r_y1": 430.11511, "r_x2": 127.92327000000002, "r_y2": 424.45309, "r_x3": 76.024773, "r_y3": 424.45309, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.382828, "r_y0": 450.55157, "r_x1": 84.514076, "r_y1": 450.55157, "r_x2": 84.514076, "r_y2": 444.88956, "r_x3": 78.382828, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.39658, "r_y0": 450.55157, "r_x1": 124.98033, "r_y1": 450.55157, "r_x2": 124.98033, "r_y2": 444.88956, "r_x3": 116.39658, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.46945, "r_y0": 468.10526, "r_x1": 181.6292, "r_y1": 468.10526, "r_x2": 181.6292, "r_y2": 462.44324, "r_x3": 167.46945, "r_y3": 462.44324, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61292, "r_y0": 484.13309, "r_x1": 184.43242, "r_y1": 484.13309, "r_x2": 184.43242, "r_y2": 478.47107, "r_x3": 165.61292, "r_y3": 478.47107, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.319511, "r_y0": 330.22235000000006, "r_x1": 132.9245, "r_y1": 330.22235000000006, "r_x2": 132.9245, "r_y2": 324.26235999999994, "r_x3": 65.319511, "r_y3": 324.26235999999994, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51457, "r_y0": 274.72992, "r_x1": 162.98782, "r_y1": 274.72992, "r_x2": 162.98782, "r_y2": 269.66394, "r_x3": 119.51457, "r_y3": 269.66394, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.72858, "r_y0": 279.97992, "r_x1": 151.41083, "r_y1": 279.97992, "r_x2": 151.41083, "r_y2": 274.91394, "r_x3": 128.72858, "r_y3": 274.91394, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.434211999999995, "r_y0": 344.26993, "r_x1": 80.27021, "r_y1": 344.26993, "r_x2": 80.27021, "r_y2": 338.95993, "r_x3": 60.434211999999995, "r_y3": 338.95993, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.598457, "r_y0": 348.69604, "r_x1": 78.854958, "r_y1": 348.69604, "r_x2": 78.854958, "r_y2": 343.38605, "r_x3": 60.598457, "r_y3": 343.38605, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.82877, "r_y0": 298.68762, "r_x1": 154.66476, "r_y1": 298.68762, "r_x2": 154.66476, "r_y2": 293.37762, "r_x3": 134.82877, "r_y3": 293.37762, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99303, "r_y0": 303.11371, "r_x1": 153.24953, "r_y1": 303.11371, "r_x2": 153.24953, "r_y2": 297.80370999999997, "r_x3": 134.99303, "r_y3": 297.80370999999997, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 351.02063, "r_x1": 197.14943, "r_y1": 351.02063, "r_x2": 197.14943, "r_y2": 345.35861, "r_x3": 150.55193, "r_y3": 345.35861, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 400.08542, "r_x1": 156.68318, "r_y1": 400.08542, "r_x2": 156.68318, "r_y2": 394.4234, "r_x3": 150.55193, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 400.08542, "r_x1": 197.14943, "r_y1": 400.08542, "r_x2": 197.14943, "r_y2": 394.4234, "r_x3": 188.56567, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.18539, "r_y0": 381.33044, "r_x1": 197.31964, "r_y1": 381.33044, "r_x2": 197.31964, "r_y2": 375.66843, "r_x3": 150.18539, "r_y3": 375.66843, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 445.91049, "r_x1": 156.68318, "r_y1": 445.91049, "r_x2": 156.68318, "r_y2": 440.24847000000005, "r_x3": 150.55193, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 445.91049, "r_x1": 197.14943, "r_y1": 445.91049, "r_x2": 197.14943, "r_y2": 440.24847000000005, "r_x3": 188.56567, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86377, "r_y0": 427.75537, "r_x1": 199.76227, "r_y1": 427.75537, "r_x2": 199.76227, "r_y2": 422.09335, "r_x3": 147.86377, "r_y3": 422.09335, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.56567000000004, "r_y0": 319.92487, "r_x1": 255.72542, "r_y1": 319.92487, "r_x2": 255.72542, "r_y2": 314.26285000000007, "r_x3": 241.56567000000004, "r_y3": 314.26285000000007, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.91730000000004, "r_y0": 367.02695, "r_x1": 256.07706, "r_y1": 367.02695, "r_x2": 256.07706, "r_y2": 361.36493, "r_x3": 241.91730000000004, "r_y3": 361.36493, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.054, "r_y0": 342.28131, "r_x1": 248.72363000000004, "r_y1": 342.28131, "r_x2": 248.72363000000004, "r_y2": 336.61929000000003, "r_x3": 228.054, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.2919, "r_y0": 342.28131, "r_x1": 269.39325, "r_y1": 342.28131, "r_x2": 269.39325, "r_y2": 336.61929000000003, "r_x3": 246.2919, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.44568000000004, "r_y0": 410.80884, "r_x1": 238.73892, "r_y1": 410.80884, "r_x2": 238.73892, "r_y2": 405.14682, "r_x3": 228.44568000000004, "r_y3": 405.14682, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.29767, "r_y0": 410.86526, "r_x1": 271.77792, "r_y1": 410.86526, "r_x2": 271.77792, "r_y2": 405.2032500000001, "r_x3": 256.29767, "r_y3": 405.2032500000001, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.54543, "r_y0": 387.87546, "r_x1": 258.08942, "r_y1": 387.87546, "r_x2": 258.08942, "r_y2": 382.21344, "r_x3": 239.54543, "r_y3": 382.21344, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.14704100000001, "r_y0": 449.78326, "r_x1": 59.51152, "r_y1": 449.78326, "r_x2": 59.51152, "r_y2": 384.87183, "r_x3": 54.14704100000001, "r_y3": 384.87183, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.235424, "r_y0": 378.45421999999996, "r_x1": 59.30449699999999, "r_y1": 378.45421999999996, "r_x2": 59.30449699999999, "r_y2": 373.81232, "r_x3": 54.235424, "r_y3": 373.81232, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.295891, "r_y0": 490.36688, "r_x1": 122.16431, "r_y1": 490.36688, "r_x2": 122.16431, "r_y2": 484.53189, "r_x3": 85.295891, "r_y3": 484.53189, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.66599, "r_y0": 285.45572000000004, "r_x1": 265.3194, "r_y1": 285.45572000000004, "r_x2": 265.3194, "r_y2": 279.54607999999996, "r_x3": 229.66599, "r_y3": 279.54607999999996, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17369, "r_y0": 506.12943, "r_x1": 190.41711, "r_y1": 506.12943, "r_x2": 190.41711, "r_y2": 500.3031, "r_x3": 157.17369, "r_y3": 500.3031, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.81598999999997, "r_y0": 443.89206, "r_x1": 270.78442, "r_y1": 443.89206, "r_x2": 270.78442, "r_y2": 438.05542, "r_x3": 227.81598999999997, "r_y3": 438.05542, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.70262, "r_y0": 449.8904999999999, "r_x1": 263.51105, "r_y1": 449.8904999999999, "r_x2": 263.51105, "r_y2": 444.06183, "r_x3": 233.70262, "r_y3": 444.06183, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.74655, "r_y0": 298.75903, "r_x1": 212.16055, "r_y1": 298.75903, "r_x2": 212.16055, "r_y2": 293.39502, "r_x3": 184.74655, "r_y3": 293.39502, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91229, "r_y0": 304.50903, "r_x1": 216.74378999999996, "r_y1": 304.50903, "r_x2": 216.74378999999996, "r_y2": 299.14502, "r_x3": 178.91229, "r_y3": 299.14502, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.24574, "r_y0": 287.84817999999996, "r_x1": 198.89099, "r_y1": 287.84817999999996, "r_x2": 198.89099, "r_y2": 282.7822, "r_x3": 194.24574, "r_y3": 282.7822, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.45587, "r_y0": 277.82916, "r_x1": 276.47089, "r_y1": 277.82916, "r_x2": 276.47089, "r_y2": 271.86914, "r_x3": 221.45587, "r_y3": 271.86914, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65219, "r_y0": 329.10443, "r_x1": 197.29019, "r_y1": 329.10443, "r_x2": 197.29019, "r_y2": 323.44241, "r_x3": 151.65219, "r_y3": 323.44241, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43277, "r_y0": 335.10443, "r_x1": 184.19028, "r_y1": 335.10443, "r_x2": 184.19028, "r_y2": 329.44241, "r_x3": 163.43277, "r_y3": 329.44241, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 70, "label": "text", "bbox": { "l": 74.253464, "t": 258.21472000000006, "r": 101.75846, "b": 264.17474000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.253464, "r_y0": 264.17474000000004, "r_x1": 101.75846, "r_y1": 264.17474000000004, "r_x2": 101.75846, "r_y2": 258.21472000000006, "r_x3": 74.253464, "r_y3": 258.21472000000006, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 122.29972, "t": 258.34520999999995, "r": 157.83972, "b": 264.30524, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.29972, "r_y0": 264.30524, "r_x1": 157.83972, "r_y1": 264.30524, "r_x2": 157.83972, "r_y2": 258.34520999999995, "r_x3": 122.29972, "r_y3": 258.34520999999995, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 78.549347, "t": 371.38579999999996, "r": 125.68359000000001, "b": 377.04782, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.549347, "r_y0": 377.04782, "r_x1": 125.68359000000001, "r_y1": 377.04782, "r_x2": 125.68359000000001, "r_y2": 371.38579999999996, "r_x3": 78.549347, "r_y3": 371.38579999999996, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 78.513298, "t": 391.31857, "r": 84.644547, "b": 396.98059, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.513298, "r_y0": 396.98059, "r_x1": 84.644547, "r_y1": 396.98059, "r_x2": 84.644547, "r_y2": 391.31857, "r_x3": 78.513298, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 116.52705, "t": 391.31857, "r": 125.11079999999998, "b": 396.98059, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.52705, "r_y0": 396.98059, "r_x1": 125.11079999999998, "r_y1": 396.98059, "r_x2": 125.11079999999998, "r_y2": 391.31857, "r_x3": 116.52705, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 76.024773, "t": 424.45309, "r": 127.92327000000002, "b": 430.11511, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.024773, "r_y0": 430.11511, "r_x1": 127.92327000000002, "r_y1": 430.11511, "r_x2": 127.92327000000002, "r_y2": 424.45309, "r_x3": 76.024773, "r_y3": 424.45309, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 78.382828, "t": 444.88956, "r": 84.514076, "b": 450.55157, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.382828, "r_y0": 450.55157, "r_x1": 84.514076, "r_y1": 450.55157, "r_x2": 84.514076, "r_y2": 444.88956, "r_x3": 78.382828, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 116.39658, "t": 444.88956, "r": 124.98033, "b": 450.55157, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.39658, "r_y0": 450.55157, "r_x1": 124.98033, "r_y1": 450.55157, "r_x2": 124.98033, "r_y2": 444.88956, "r_x3": 116.39658, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 167.46945, "t": 462.44324, "r": 181.6292, "b": 468.10526, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.46945, "r_y0": 468.10526, "r_x1": 181.6292, "r_y1": 468.10526, "r_x2": 181.6292, "r_y2": 462.44324, "r_x3": 167.46945, "r_y3": 462.44324, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 165.61292, "t": 478.47107, "r": 184.43242, "b": 484.13309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61292, "r_y0": 484.13309, "r_x1": 184.43242, "r_y1": 484.13309, "r_x2": 184.43242, "r_y2": 478.47107, "r_x3": 165.61292, "r_y3": 478.47107, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 65.319511, "t": 324.26235999999994, "r": 132.9245, "b": 330.22235000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.319511, "r_y0": 330.22235000000006, "r_x1": 132.9245, "r_y1": 330.22235000000006, "r_x2": 132.9245, "r_y2": 324.26235999999994, "r_x3": 65.319511, "r_y3": 324.26235999999994, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 119.51457, "t": 269.66394, "r": 162.98782, "b": 274.72992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51457, "r_y0": 274.72992, "r_x1": 162.98782, "r_y1": 274.72992, "r_x2": 162.98782, "r_y2": 269.66394, "r_x3": 119.51457, "r_y3": 269.66394, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 128.72858, "t": 274.91394, "r": 151.41083, "b": 279.97992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.72858, "r_y0": 279.97992, "r_x1": 151.41083, "r_y1": 279.97992, "r_x2": 151.41083, "r_y2": 274.91394, "r_x3": 128.72858, "r_y3": 274.91394, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 60.434211999999995, "t": 338.95993, "r": 80.27021, "b": 344.26993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.434211999999995, "r_y0": 344.26993, "r_x1": 80.27021, "r_y1": 344.26993, "r_x2": 80.27021, "r_y2": 338.95993, "r_x3": 60.434211999999995, "r_y3": 338.95993, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 60.598457, "t": 343.38605, "r": 78.854958, "b": 348.69604, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.598457, "r_y0": 348.69604, "r_x1": 78.854958, "r_y1": 348.69604, "r_x2": 78.854958, "r_y2": 343.38605, "r_x3": 60.598457, "r_y3": 343.38605, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 134.82877, "t": 293.37762, "r": 154.66476, "b": 298.68762, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.82877, "r_y0": 298.68762, "r_x1": 154.66476, "r_y1": 298.68762, "r_x2": 154.66476, "r_y2": 293.37762, "r_x3": 134.82877, "r_y3": 293.37762, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 134.99303, "t": 297.80370999999997, "r": 153.24953, "b": 303.11371, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99303, "r_y0": 303.11371, "r_x1": 153.24953, "r_y1": 303.11371, "r_x2": 153.24953, "r_y2": 297.80370999999997, "r_x3": 134.99303, "r_y3": 297.80370999999997, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 150.55193, "t": 345.35861, "r": 197.14943, "b": 351.02063, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 351.02063, "r_x1": 197.14943, "r_y1": 351.02063, "r_x2": 197.14943, "r_y2": 345.35861, "r_x3": 150.55193, "r_y3": 345.35861, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 150.55193, "t": 394.4234, "r": 156.68318, "b": 400.08542, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 400.08542, "r_x1": 156.68318, "r_y1": 400.08542, "r_x2": 156.68318, "r_y2": 394.4234, "r_x3": 150.55193, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 188.56567, "t": 394.4234, "r": 197.14943, "b": 400.08542, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 400.08542, "r_x1": 197.14943, "r_y1": 400.08542, "r_x2": 197.14943, "r_y2": 394.4234, "r_x3": 188.56567, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 150.18539, "t": 375.66843, "r": 197.31964, "b": 381.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.18539, "r_y0": 381.33044, "r_x1": 197.31964, "r_y1": 381.33044, "r_x2": 197.31964, "r_y2": 375.66843, "r_x3": 150.18539, "r_y3": 375.66843, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 150.55193, "t": 440.24847000000005, "r": 156.68318, "b": 445.91049, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 445.91049, "r_x1": 156.68318, "r_y1": 445.91049, "r_x2": 156.68318, "r_y2": 440.24847000000005, "r_x3": 150.55193, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 188.56567, "t": 440.24847000000005, "r": 197.14943, "b": 445.91049, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 445.91049, "r_x1": 197.14943, "r_y1": 445.91049, "r_x2": 197.14943, "r_y2": 440.24847000000005, "r_x3": 188.56567, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 147.86377, "t": 422.09335, "r": 199.76227, "b": 427.75537, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86377, "r_y0": 427.75537, "r_x1": 199.76227, "r_y1": 427.75537, "r_x2": 199.76227, "r_y2": 422.09335, "r_x3": 147.86377, "r_y3": 422.09335, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 241.56567000000004, "t": 314.26285000000007, "r": 255.72542, "b": 319.92487, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.56567000000004, "r_y0": 319.92487, "r_x1": 255.72542, "r_y1": 319.92487, "r_x2": 255.72542, "r_y2": 314.26285000000007, "r_x3": 241.56567000000004, "r_y3": 314.26285000000007, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 241.91730000000004, "t": 361.36493, "r": 256.07706, "b": 367.02695, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.91730000000004, "r_y0": 367.02695, "r_x1": 256.07706, "r_y1": 367.02695, "r_x2": 256.07706, "r_y2": 361.36493, "r_x3": 241.91730000000004, "r_y3": 361.36493, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 228.054, "t": 336.61929000000003, "r": 248.72363000000004, "b": 342.28131, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.054, "r_y0": 342.28131, "r_x1": 248.72363000000004, "r_y1": 342.28131, "r_x2": 248.72363000000004, "r_y2": 336.61929000000003, "r_x3": 228.054, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 246.2919, "t": 336.61929000000003, "r": 269.39325, "b": 342.28131, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.2919, "r_y0": 342.28131, "r_x1": 269.39325, "r_y1": 342.28131, "r_x2": 269.39325, "r_y2": 336.61929000000003, "r_x3": 246.2919, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 228.44568000000004, "t": 405.14682, "r": 238.73892, "b": 410.80884, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.44568000000004, "r_y0": 410.80884, "r_x1": 238.73892, "r_y1": 410.80884, "r_x2": 238.73892, "r_y2": 405.14682, "r_x3": 228.44568000000004, "r_y3": 405.14682, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 256.29767, "t": 405.2032500000001, "r": 271.77792, "b": 410.86526, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.29767, "r_y0": 410.86526, "r_x1": 271.77792, "r_y1": 410.86526, "r_x2": 271.77792, "r_y2": 405.2032500000001, "r_x3": 256.29767, "r_y3": 405.2032500000001, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 239.54543, "t": 382.21344, "r": 258.08942, "b": 387.87546, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.54543, "r_y0": 387.87546, "r_x1": 258.08942, "r_y1": 387.87546, "r_x2": 258.08942, "r_y2": 382.21344, "r_x3": 239.54543, "r_y3": 382.21344, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 54.14704100000001, "t": 384.87183, "r": 59.51152, "b": 449.78326, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.14704100000001, "r_y0": 449.78326, "r_x1": 59.51152, "r_y1": 449.78326, "r_x2": 59.51152, "r_y2": 384.87183, "r_x3": 54.14704100000001, "r_y3": 384.87183, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 54.235424, "t": 373.81232, "r": 59.30449699999999, "b": 378.45421999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.235424, "r_y0": 378.45421999999996, "r_x1": 59.30449699999999, "r_y1": 378.45421999999996, "r_x2": 59.30449699999999, "r_y2": 373.81232, "r_x3": 54.235424, "r_y3": 373.81232, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 85.295891, "t": 484.53189, "r": 122.16431, "b": 490.36688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.295891, "r_y0": 490.36688, "r_x1": 122.16431, "r_y1": 490.36688, "r_x2": 122.16431, "r_y2": 484.53189, "r_x3": 85.295891, "r_y3": 484.53189, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 229.66599, "t": 279.54607999999996, "r": 265.3194, "b": 285.45572000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.66599, "r_y0": 285.45572000000004, "r_x1": 265.3194, "r_y1": 285.45572000000004, "r_x2": 265.3194, "r_y2": 279.54607999999996, "r_x3": 229.66599, "r_y3": 279.54607999999996, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 157.17369, "t": 500.3031, "r": 190.41711, "b": 506.12943, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17369, "r_y0": 506.12943, "r_x1": 190.41711, "r_y1": 506.12943, "r_x2": 190.41711, "r_y2": 500.3031, "r_x3": 157.17369, "r_y3": 500.3031, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 227.81598999999997, "t": 438.05542, "r": 270.78442, "b": 443.89206, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.81598999999997, "r_y0": 443.89206, "r_x1": 270.78442, "r_y1": 443.89206, "r_x2": 270.78442, "r_y2": 438.05542, "r_x3": 227.81598999999997, "r_y3": 438.05542, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 233.70262, "t": 444.06183, "r": 263.51105, "b": 449.8904999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.70262, "r_y0": 449.8904999999999, "r_x1": 263.51105, "r_y1": 449.8904999999999, "r_x2": 263.51105, "r_y2": 444.06183, "r_x3": 233.70262, "r_y3": 444.06183, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 184.74655, "t": 293.39502, "r": 212.16055, "b": 298.75903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.74655, "r_y0": 298.75903, "r_x1": 212.16055, "r_y1": 298.75903, "r_x2": 212.16055, "r_y2": 293.39502, "r_x3": 184.74655, "r_y3": 293.39502, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 178.91229, "t": 299.14502, "r": 216.74378999999996, "b": 304.50903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91229, "r_y0": 304.50903, "r_x1": 216.74378999999996, "r_y1": 304.50903, "r_x2": 216.74378999999996, "r_y2": 299.14502, "r_x3": 178.91229, "r_y3": 299.14502, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 194.24574, "t": 282.7822, "r": 198.89099, "b": 287.84817999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.24574, "r_y0": 287.84817999999996, "r_x1": 198.89099, "r_y1": 287.84817999999996, "r_x2": 198.89099, "r_y2": 282.7822, "r_x3": 194.24574, "r_y3": 282.7822, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 221.45587, "t": 271.86914, "r": 276.47089, "b": 277.82916, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.45587, "r_y0": 277.82916, "r_x1": 276.47089, "r_y1": 277.82916, "r_x2": 276.47089, "r_y2": 271.86914, "r_x3": 221.45587, "r_y3": 271.86914, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 151.65219, "t": 323.44241, "r": 197.29019, "b": 329.10443, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65219, "r_y0": 329.10443, "r_x1": 197.29019, "r_y1": 329.10443, "r_x2": 197.29019, "r_y2": 323.44241, "r_x3": 151.65219, "r_y3": 323.44241, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 163.43277, "t": 329.44241, "r": 184.19028, "b": 335.10443, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43277, "r_y0": 335.10443, "r_x1": 184.19028, "r_y1": 335.10443, "r_x2": 184.19028, "r_y2": 329.44241, "r_x3": 163.43277, "r_y3": 329.44241, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 8, "page_no": 4, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 50.112, "t": 527.7828099999999, "r": 286.36597, "b": 680.27094, "coord_origin": "TOPLEFT" }, "confidence": 0.8913407325744629, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 536.80893, "r_x1": 229.78752, "r_y1": 536.80893, "r_x2": 229.78752, "r_y2": 527.90237, "r_x3": 50.112, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.787, "r_y0": 536.7392, "r_x1": 267.76196, "r_y1": 536.7392, "r_x2": 267.76196, "r_y2": 527.7828099999999, "r_x3": 231.787, "r_y3": 527.7828099999999, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76401, "r_y0": 536.80893, "r_x1": 286.36169, "r_y1": 536.80893, "r_x2": 286.36169, "r_y2": 527.90237, "r_x3": 269.76401, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 548.76393, "r_x1": 286.36508, "r_y1": 548.76393, "r_x2": 286.36508, "r_y2": 539.85738, "r_x3": 50.112015, "r_y3": 539.85738, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 560.71992, "r_x1": 205.84735, "r_y1": 560.71992, "r_x2": 205.84735, "r_y2": 551.81337, "r_x3": 50.112015, "r_y3": 551.81337, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.01802, "r_y0": 560.6501900000001, "r_x1": 286.36392, "r_y1": 560.6501900000001, "r_x2": 286.36392, "r_y2": 551.69382, "r_x3": 208.01802, "r_y3": 551.69382, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 572.67493, "r_x1": 64.498009, "r_y1": 572.67493, "r_x2": 64.498009, "r_y2": 563.76837, "r_x3": 50.112015, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.165016, "r_y0": 572.60519, "r_x1": 151.31288, "r_y1": 572.60519, "r_x2": 151.31288, "r_y2": 563.64882, "r_x3": 68.165016, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31302, "r_y0": 572.67493, "r_x1": 153.80367, "r_y1": 572.67493, "r_x2": 153.80367, "r_y2": 563.76837, "r_x3": 151.31302, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.41884, "r_y0": 572.67493, "r_x1": 241.93283000000002, "r_y1": 572.67493, "r_x2": 241.93283000000002, "r_y2": 563.76837, "r_x3": 160.41884, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.59502, "r_y0": 572.60519, "r_x1": 286.362, "r_y1": 572.60519, "r_x2": 286.362, "r_y2": 563.64882, "r_x3": 245.59502, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 584.5602, "r_x1": 85.519089, "r_y1": 584.5602, "r_x2": 85.519089, "r_y2": 575.60382, "r_x3": 50.112015, "r_y3": 575.60382, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.623016, "r_y0": 584.6299300000001, "r_x1": 286.36072, "r_y1": 584.6299300000001, "r_x2": 286.36072, "r_y2": 575.7233699999999, "r_x3": 88.623016, "r_y3": 575.7233699999999, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 596.58493, "r_x1": 286.36511, "r_y1": 596.58493, "r_x2": 286.36511, "r_y2": 587.6783800000001, "r_x3": 50.112015, "r_y3": 587.6783800000001, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 608.53993, "r_x1": 286.36508, "r_y1": 608.53993, "r_x2": 286.36508, "r_y2": 599.63338, "r_x3": 50.112015, "r_y3": 599.63338, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 620.4949300000001, "r_x1": 240.43756000000002, "r_y1": 620.4949300000001, "r_x2": 240.43756000000002, "r_y2": 611.58838, "r_x3": 50.112015, "r_y3": 611.58838, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.19801, "r_y0": 620.4252, "r_x1": 286.36597, "r_y1": 620.4252, "r_x2": 286.36597, "r_y2": 611.46883, "r_x3": 243.19801, "r_y3": 611.46883, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 632.3812, "r_x1": 286.36511, "r_y1": 632.3812, "r_x2": 286.36511, "r_y2": 623.42482, "r_x3": 50.112015, "r_y3": 623.42482, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 644.3362, "r_x1": 286.36508, "r_y1": 644.3362, "r_x2": 286.36508, "r_y2": 635.37982, "r_x3": 50.112015, "r_y3": 635.37982, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 656.36093, "r_x1": 220.58205, "r_y1": 656.36093, "r_x2": 220.58205, "r_y2": 647.45438, "r_x3": 50.112015, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.57802000000004, "r_y0": 656.14175, "r_x1": 228.32693, "r_y1": 656.14175, "r_x2": 228.32693, "r_y2": 647.29497, "r_x3": 220.57802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.32700999999997, "r_y0": 656.36093, "r_x1": 236.07791000000003, "r_y1": 656.36093, "r_x2": 236.07791000000003, "r_y2": 647.45438, "r_x3": 228.32700999999997, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.07802000000004, "r_y0": 656.14175, "r_x1": 243.82693, "r_y1": 656.14175, "r_x2": 243.82693, "r_y2": 647.29497, "r_x3": 236.07802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.82602, "r_y0": 656.36093, "r_x1": 255.29298000000003, "r_y1": 656.36093, "r_x2": 255.29298000000003, "r_y2": 647.45438, "r_x3": 243.82602, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29102000000003, "r_y0": 656.14175, "r_x1": 263.03992, "r_y1": 656.14175, "r_x2": 263.03992, "r_y2": 647.29497, "r_x3": 255.29102000000003, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04001, "r_y0": 656.36093, "r_x1": 286.36246, "r_y1": 656.36093, "r_x2": 286.36246, "r_y2": 647.45438, "r_x3": 263.04001, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 668.31594, "r_x1": 286.36511, "r_y1": 668.31594, "r_x2": 286.36511, "r_y2": 659.40938, "r_x3": 50.112015, "r_y3": 659.40938, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 680.27094, "r_x1": 218.46996, "r_y1": 680.27094, "r_x2": 218.46996, "r_y2": 671.36438, "r_x3": 50.112015, "r_y3": 671.36438, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes." }, { "label": "text", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.862, "t": 249.53441999999995, "r": 545.11505, "b": 294.3069499999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9831458330154419, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.44097999999997, "r_x1": 523.05786, "r_y1": 258.44097999999997, "r_x2": 523.05786, "r_y2": 249.53441999999995, "r_x3": 308.862, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.19983, "r_y0": 258.44097999999997, "r_x1": 545.11505, "r_y1": 258.44097999999997, "r_x2": 545.11505, "r_y2": 249.53441999999995, "r_x3": 525.19983, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.39697, "r_x1": 517.55847, "r_y1": 270.39697, "r_x2": 517.55847, "r_y2": 261.49042, "r_x3": 308.862, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 270.39697, "r_x1": 545.11499, "r_y1": 270.39697, "r_x2": 545.11499, "r_y2": 261.49042, "r_x3": 520.76642, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.35196, "r_x1": 534.80377, "r_y1": 282.35196, "r_x2": 534.80377, "r_y2": 273.44537, "r_x3": 308.862, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36414, "r_y0": 282.35196, "r_x1": 545.11505, "r_y1": 282.35196, "r_x2": 545.11505, "r_y2": 273.44537, "r_x3": 537.36414, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.3069499999999, "r_x1": 341.24045, "r_y1": 294.3069499999999, "r_x2": 341.24045, "r_y2": 285.40039, "r_x3": 308.862, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73099, "r_y0": 294.07782000000003, "r_x1": 417.23508, "r_y1": 294.07782000000003, "r_x2": 417.23508, "r_y2": 285.49005, "r_x3": 343.73099, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23398, "r_y0": 294.3069499999999, "r_x1": 436.60129, "r_y1": 294.3069499999999, "r_x2": 436.60129, "r_y2": 285.40039, "r_x3": 417.23398, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09198, "r_y0": 294.07782000000003, "r_x1": 516.56116, "r_y1": 294.07782000000003, "r_x2": 516.56116, "r_y2": 285.49005, "r_x3": 439.09198, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56097, "r_y0": 294.3069499999999, "r_x1": 519.05164, "r_y1": 294.3069499999999, "r_x2": 519.05164, "r_y2": 285.40039, "r_x3": 516.56097, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86194, "t": 297.33981, "r": 545.11511, "b": 413.96182, "coord_origin": "TOPLEFT" }, "confidence": 0.9862009882926941, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 306.2962, "r_x1": 400.86649, "r_y1": 306.2962, "r_x2": 400.86649, "r_y2": 297.33981, "r_x3": 320.81696, "r_y3": 297.33981, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91394, "r_y0": 306.36594, "r_x1": 528.33685, "r_y1": 306.36594, "r_x2": 528.33685, "r_y2": 297.45938, "r_x3": 403.91394, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.7179, "r_y0": 306.36594, "r_x1": 545.11383, "r_y1": 306.36594, "r_x2": 545.11383, "r_y2": 297.45938, "r_x3": 530.7179, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 318.32092, "r_x1": 517.5285, "r_y1": 318.32092, "r_x2": 517.5285, "r_y2": 309.41437, "r_x3": 308.86194, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09387, "r_y0": 318.32092, "r_x1": 545.11493, "r_y1": 318.32092, "r_x2": 545.11493, "r_y2": 309.41437, "r_x3": 524.09387, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 330.27591, "r_x1": 432.35833999999994, "r_y1": 330.27591, "r_x2": 432.35833999999994, "r_y2": 321.36934999999994, "r_x3": 308.86194, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.81995000000006, "r_y0": 330.04678, "r_x1": 510.29041, "r_y1": 330.04678, "r_x2": 510.29041, "r_y2": 321.45901, "r_x3": 435.81995000000006, "r_y3": 321.45901, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.97797, "r_y0": 330.27591, "r_x1": 520.62305, "r_y1": 330.27591, "r_x2": 520.62305, "r_y2": 321.36934999999994, "r_x3": 513.97797, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08008, "r_y0": 330.27591, "r_x1": 545.11115, "r_y1": 330.27591, "r_x2": 545.11115, "r_y2": 321.36934999999994, "r_x3": 524.08008, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 342.2309, "r_x1": 527.76013, "r_y1": 342.2309, "r_x2": 527.76013, "r_y2": 333.32434, "r_x3": 308.86197, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.729, "r_y0": 342.2309, "r_x1": 545.11499, "r_y1": 342.2309, "r_x2": 545.11499, "r_y2": 333.32434, "r_x3": 530.729, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 354.18588, "r_x1": 526.85352, "r_y1": 354.18588, "r_x2": 526.85352, "r_y2": 345.27933, "r_x3": 308.86197, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62311, "r_y0": 354.18588, "r_x1": 545.11493, "r_y1": 354.18588, "r_x2": 545.11493, "r_y2": 345.27933, "r_x3": 529.62311, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 366.14188, "r_x1": 524.51245, "r_y1": 366.14188, "r_x2": 524.51245, "r_y2": 357.23532, "r_x3": 308.86197, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.96948, "r_y0": 366.14188, "r_x1": 545.11511, "r_y1": 366.14188, "r_x2": 545.11511, "r_y2": 357.23532, "r_x3": 527.96948, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 378.09685999999994, "r_x1": 370.39096, "r_y1": 378.09685999999994, "r_x2": 370.39096, "r_y2": 369.19031000000007, "r_x3": 308.86197, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44449, "r_y0": 378.09685999999994, "r_x1": 526.91339, "r_y1": 378.09685999999994, "r_x2": 526.91339, "r_y2": 369.19031000000007, "r_x3": 377.44449, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72906, "r_y0": 378.09685999999994, "r_x1": 545.11505, "r_y1": 378.09685999999994, "r_x2": 545.11505, "r_y2": 369.19031000000007, "r_x3": 530.72906, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 390.05185, "r_x1": 505.46395999999993, "r_y1": 390.05185, "r_x2": 505.46395999999993, "r_y2": 381.14529000000005, "r_x3": 308.86197, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03430000000003, "r_y0": 390.05185, "r_x1": 545.11511, "r_y1": 390.05185, "r_x2": 545.11511, "r_y2": 381.14529000000005, "r_x3": 508.03430000000003, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 402.00684, "r_x1": 517.68799, "r_y1": 402.00684, "r_x2": 517.68799, "r_y2": 393.10028, "r_x3": 308.86197, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 402.00684, "r_x1": 545.11499, "r_y1": 402.00684, "r_x2": 545.11499, "r_y2": 393.10028, "r_x3": 520.76642, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 413.96182, "r_x1": 528.01935, "r_y1": 413.96182, "r_x2": 528.01935, "r_y2": 405.05526999999995, "r_x3": 308.86197, "r_y3": 405.05526999999995, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. \"Scene Understanding\", \"Image Captioning\"), something which we relate to the simplicity of table images." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86197, "t": 417.11426, "r": 545.11511, "b": 545.57271, "coord_origin": "TOPLEFT" }, "confidence": 0.9851906895637512, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 426.02081, "r_x1": 515.49609, "r_y1": 426.02081, "r_x2": 515.49609, "r_y2": 417.11426, "r_x3": 320.81696, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.7663, "r_y0": 426.02081, "r_x1": 545.11487, "r_y1": 426.02081, "r_x2": 545.11487, "r_y2": 417.11426, "r_x3": 520.7663, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 437.9758, "r_x1": 343.72107, "r_y1": 437.9758, "r_x2": 343.72107, "r_y2": 429.0692399999999, "r_x3": 308.86197, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.03796, "r_y0": 437.74667, "r_x1": 446.45471000000003, "r_y1": 437.74667, "r_x2": 446.45471000000003, "r_y2": 429.15891, "r_x3": 347.03796, "r_y3": 429.15891, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.93996999999996, "r_y0": 437.9758, "r_x1": 503.06055000000003, "r_y1": 437.9758, "r_x2": 503.06055000000003, "r_y2": 429.0692399999999, "r_x3": 449.93996999999996, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.37808, "r_y0": 437.9758, "r_x1": 537.3717, "r_y1": 437.9758, "r_x2": 537.3717, "r_y2": 429.0692399999999, "r_x3": 506.37808, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.68927, "r_y0": 437.9758, "r_x1": 545.11267, "r_y1": 437.9758, "r_x2": 545.11267, "r_y2": 429.0692399999999, "r_x3": 540.68927, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 449.93079, "r_x1": 522.78894, "r_y1": 449.93079, "r_x2": 522.78894, "r_y2": 441.02423, "r_x3": 308.86197, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.7478, "r_y0": 449.93079, "r_x1": 545.11511, "r_y1": 449.93079, "r_x2": 545.11511, "r_y2": 441.02423, "r_x3": 525.7478, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 461.88577, "r_x1": 384.14929, "r_y1": 461.88577, "r_x2": 384.14929, "r_y2": 452.97922, "r_x3": 308.86197, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37466, "r_y0": 461.88577, "r_x1": 527.84985, "r_y1": 461.88577, "r_x2": 527.84985, "r_y2": 452.97922, "r_x3": 393.37466, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39282, "r_y0": 461.88577, "r_x1": 545.11505, "r_y1": 461.88577, "r_x2": 545.11505, "r_y2": 452.97922, "r_x3": 532.39282, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 473.84177, "r_x1": 529.7627, "r_y1": 473.84177, "r_x2": 529.7627, "r_y2": 464.93521, "r_x3": 308.86197, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94073, "r_y0": 473.84177, "r_x1": 545.11505, "r_y1": 473.84177, "r_x2": 545.11505, "r_y2": 464.93521, "r_x3": 532.94073, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 485.79675, "r_x1": 514.17126, "r_y1": 485.79675, "r_x2": 514.17126, "r_y2": 476.8902, "r_x3": 308.86197, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89105, "r_y0": 485.79675, "r_x1": 545.11511, "r_y1": 485.79675, "r_x2": 545.11511, "r_y2": 476.8902, "r_x3": 516.89105, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.75174, "r_x1": 527.63068, "r_y1": 497.75174, "r_x2": 527.63068, "r_y2": 488.84518, "r_x3": 308.86197, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62317, "r_y0": 497.75174, "r_x1": 545.11499, "r_y1": 497.75174, "r_x2": 545.11499, "r_y2": 488.84518, "r_x3": 529.62317, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.70673, "r_x1": 508.3630999999999, "r_y1": 509.70673, "r_x2": 508.3630999999999, "r_y2": 500.80017, "r_x3": 308.86197, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09286000000003, "r_y0": 509.70673, "r_x1": 545.11511, "r_y1": 509.70673, "r_x2": 545.11511, "r_y2": 500.80017, "r_x3": 511.09286000000003, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.6617100000001, "r_x1": 545.11499, "r_y1": 521.6617100000001, "r_x2": 545.11499, "r_y2": 512.7551599999999, "r_x3": 308.86197, "r_y3": 512.7551599999999, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.61771, "r_x1": 545.11511, "r_y1": 533.61771, "r_x2": 545.11511, "r_y2": 524.71115, "r_x3": 308.86197, "r_y3": 524.71115, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.57271, "r_x1": 369.73349, "r_y1": 545.57271, "r_x2": 369.73349, "r_y2": 536.66615, "r_x3": 308.86197, "r_y3": 536.66615, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score." }, { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86194, "t": 548.6046, "r": 545.11511, "b": 653.27271, "coord_origin": "TOPLEFT" }, "confidence": 0.9869195818901062, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 557.56097, "r_x1": 404.76184, "r_y1": 557.56097, "r_x2": 404.76184, "r_y2": 548.6046, "r_x3": 320.81696, "r_y3": 548.6046, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34094, "r_y0": 557.63071, "r_x1": 545.11505, "r_y1": 557.63071, "r_x2": 545.11505, "r_y2": 548.72415, "r_x3": 410.34094, "r_y3": 548.72415, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 569.5867000000001, "r_x1": 545.11493, "r_y1": 569.5867000000001, "r_x2": 545.11493, "r_y2": 560.68015, "r_x3": 308.86194, "r_y3": 560.68015, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 581.5417, "r_x1": 545.11511, "r_y1": 581.5417, "r_x2": 545.11511, "r_y2": 572.6351500000001, "r_x3": 308.86194, "r_y3": 572.6351500000001, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 593.4967, "r_x1": 545.11493, "r_y1": 593.4967, "r_x2": 545.11493, "r_y2": 584.59015, "r_x3": 308.86194, "r_y3": 584.59015, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 605.45171, "r_x1": 545.11499, "r_y1": 605.45171, "r_x2": 545.11499, "r_y2": 596.54515, "r_x3": 308.86194, "r_y3": 596.54515, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 617.40671, "r_x1": 545.11505, "r_y1": 617.40671, "r_x2": 545.11505, "r_y2": 608.50015, "r_x3": 308.86194, "r_y3": 608.50015, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 629.36171, "r_x1": 545.11505, "r_y1": 629.36171, "r_x2": 545.11505, "r_y2": 620.45515, "r_x3": 308.86194, "r_y3": 620.45515, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 641.3177000000001, "r_x1": 381.67859, "r_y1": 641.3177000000001, "r_x2": 381.67859, "r_y2": 632.41115, "r_x3": 308.86194, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.99695, "r_y0": 641.09853, "r_x1": 391.74585, "r_y1": 641.09853, "r_x2": 391.74585, "r_y2": 632.25174, "r_x3": 383.99695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.74594, "r_y0": 641.3177000000001, "r_x1": 399.49686, "r_y1": 641.3177000000001, "r_x2": 399.49686, "r_y2": 632.41115, "r_x3": 391.74594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.49695, "r_y0": 641.09853, "r_x1": 407.24585, "r_y1": 641.09853, "r_x2": 407.24585, "r_y2": 632.25174, "r_x3": 399.49695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.24594, "r_y0": 641.3177000000001, "r_x1": 432.90958, "r_y1": 641.3177000000001, "r_x2": 432.90958, "r_y2": 632.41115, "r_x3": 407.24594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.90792999999996, "r_y0": 641.09853, "r_x1": 440.65683000000007, "r_y1": 641.09853, "r_x2": 440.65683000000007, "r_y2": 632.25174, "r_x3": 432.90792999999996, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.65691999999996, "r_y0": 641.3177000000001, "r_x1": 545.11475, "r_y1": 641.3177000000001, "r_x2": 545.11475, "r_y2": 632.41115, "r_x3": 440.65691999999996, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 653.27271, "r_x1": 398.96371, "r_y1": 653.27271, "r_x2": 398.96371, "r_y2": 644.3661500000001, "r_x3": 308.86194, "r_y3": 644.3661500000001, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTML structure tags become the object query." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86194, "t": 656.42516, "r": 545.11505, "b": 713.151726, "coord_origin": "TOPLEFT" }, "confidence": 0.9852352142333984, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81693, "r_y0": 665.33172, "r_x1": 444.34316999999993, "r_y1": 665.33172, "r_x2": 444.34316999999993, "r_y2": 656.42516, "r_x3": 320.81693, "r_y3": 656.42516, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.00591999999995, "r_y0": 665.10258, "r_x1": 545.1076, "r_y1": 665.10258, "r_x2": 545.1076, "r_y2": 656.51482, "r_x3": 447.00591999999995, "r_y3": 656.51482, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 677.2867200000001, "r_x1": 545.11505, "r_y1": 677.2867200000001, "r_x2": 545.11505, "r_y2": 668.38016, "r_x3": 308.86194, "r_y3": 668.38016, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 689.24172, "r_x1": 545.11505, "r_y1": 689.24172, "r_x2": 545.11505, "r_y2": 680.33516, "r_x3": 308.86194, "r_y3": 680.33516, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 701.196724, "r_x1": 545.11505, "r_y1": 701.196724, "r_x2": 545.11505, "r_y2": 692.290161, "r_x3": 308.86194, "r_y3": 692.290161, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 713.151726, "r_x1": 545.11505, "r_y1": 713.151726, "r_x2": 545.11505, "r_y2": 704.245163, "r_x3": 308.86194, "r_y3": 704.245163, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-" }, { "label": "page_footer", "id": 9, "page_no": 4, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.12094, "t": 734.13316, "r": 300.10223, "b": 743.039722, "coord_origin": "TOPLEFT" }, "confidence": 0.8719564080238342, "cells": [ { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12094, "r_y0": 743.039722, "r_x1": 300.10223, "r_y1": 743.039722, "r_x2": 300.10223, "r_y2": 734.13316, "r_x3": 295.12094, "r_y3": 734.13316, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" } ], "body": [ { "label": "picture", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT" }, "confidence": 0.9296807646751404, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 125.62891000000002, "r_x1": 84.927567, "r_y1": 125.62891000000002, "r_x2": 84.927567, "r_y2": 122.43970000000002, "r_x3": 81.688072, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 125.62891000000002, "r_x1": 93.026291, "r_y1": 125.62891000000002, "r_x2": 93.026291, "r_y2": 122.43970000000002, "r_x3": 86.54731, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.50498, "r_y0": 118.44135000000006, "r_x1": 115.3461, "r_y1": 118.44135000000006, "r_x2": 115.3461, "r_y2": 115.25214000000005, "r_x3": 102.50498, "r_y3": 115.25214000000005, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.140205, "r_y0": 118.40410999999995, "r_x1": 93.291527, "r_y1": 118.40410999999995, "r_x2": 93.291527, "r_y2": 115.21489999999994, "r_x3": 82.140205, "r_y3": 115.21489999999994, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 125.62891000000002, "r_x1": 104.3119, "r_y1": 125.62891000000002, "r_x2": 104.3119, "r_y2": 122.43970000000002, "r_x3": 96.748268, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 130.93291999999997, "r_x1": 102.42083, "r_y1": 130.93291999999997, "r_x2": 102.42083, "r_y2": 127.74370999999985, "r_x3": 96.748268, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 136.6449, "r_x1": 104.3119, "r_y1": 136.6449, "r_x2": 104.3119, "r_y2": 133.45569, "r_x3": 96.748268, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 142.35693000000003, "r_x1": 102.42083, "r_y1": 142.35693000000003, "r_x2": 102.42083, "r_y2": 139.16772000000003, "r_x3": 96.748268, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 125.62891000000002, "r_x1": 116.14391, "r_y1": 125.62891000000002, "r_x2": 116.14391, "r_y2": 122.43970000000002, "r_x3": 110.66107, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 130.93291999999997, "r_x1": 116.14391, "r_y1": 130.93291999999997, "r_x2": 116.14391, "r_y2": 127.74370999999985, "r_x3": 110.66107, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 136.6449, "r_x1": 116.14391, "r_y1": 136.6449, "r_x2": 116.14391, "r_y2": 133.45569, "r_x3": 110.66107, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 142.35693000000003, "r_x1": 116.14391, "r_y1": 142.35693000000003, "r_x2": 116.14391, "r_y2": 139.16772000000003, "r_x3": 110.66107, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 130.93291999999997, "r_x1": 84.927567, "r_y1": 130.93291999999997, "r_x2": 84.927567, "r_y2": 127.74370999999985, "r_x3": 81.688072, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 130.93291999999997, "r_x1": 93.026291, "r_y1": 130.93291999999997, "r_x2": 93.026291, "r_y2": 127.74370999999985, "r_x3": 86.54731, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 136.6449, "r_x1": 84.927567, "r_y1": 136.6449, "r_x2": 84.927567, "r_y2": 133.45569, "r_x3": 81.688072, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 136.6449, "r_x1": 93.026291, "r_y1": 136.6449, "r_x2": 93.026291, "r_y2": 133.45569, "r_x3": 86.54731, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 142.35693000000003, "r_x1": 84.927567, "r_y1": 142.35693000000003, "r_x2": 84.927567, "r_y2": 139.16772000000003, "r_x3": 81.688072, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 142.35693000000003, "r_x1": 93.026291, "r_y1": 142.35693000000003, "r_x2": 93.026291, "r_y2": 139.16772000000003, "r_x3": 86.54731, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.084389, "r_y0": 96.23798, "r_x1": 113.93649, "r_y1": 96.23798, "r_x2": 113.93649, "r_y2": 90.49738000000002, "r_x3": 88.084389, "r_y3": 90.49738000000002, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81002, "r_y0": 103.37798999999995, "r_x1": 119.21240000000002, "r_y1": 103.37798999999995, "r_x2": 119.21240000000002, "r_y2": 97.63738999999998, "r_x3": 82.81002, "r_y3": 97.63738999999998, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94247, "r_y0": 106.34295999999995, "r_x1": 180.01131, "r_y1": 106.34295999999995, "r_x2": 180.01131, "r_y2": 100.60235999999998, "r_x3": 143.94247, "r_y3": 100.60235999999998, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94064, "r_y0": 113.48297000000014, "r_x1": 172.0118, "r_y1": 113.48297000000014, "r_x2": 172.0118, "r_y2": 107.74237000000005, "r_x3": 151.94064, "r_y3": 107.74237000000005, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.76939000000002, "r_y0": 86.67156999999997, "r_x1": 266.39557, "r_y1": 86.67156999999997, "r_x2": 266.39557, "r_y2": 80.93096999999989, "r_x3": 251.76939000000002, "r_y3": 80.93096999999989, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 91.77161000000001, "r_x1": 270.65021, "r_y1": 91.77161000000001, "r_x2": 270.65021, "r_y2": 86.03101000000004, "r_x3": 247.51601, "r_y3": 86.03101000000004, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.03699, "r_y0": 84.30042000000003, "r_x1": 352.12589, "r_y1": 84.30042000000003, "r_x2": 352.12589, "r_y2": 78.55980999999997, "r_x3": 331.03699, "r_y3": 78.55980999999997, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56421, "r_y0": 101.77282999999989, "r_x1": 431.7261, "r_y1": 101.77282999999989, "r_x2": 431.7261, "r_y2": 96.03223000000003, "r_x3": 390.56421, "r_y3": 96.03223000000003, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82422, "r_y0": 107.89287999999999, "r_x1": 435.46966999999995, "r_y1": 107.89287999999999, "r_x2": 435.46966999999995, "r_y2": 102.15228000000013, "r_x3": 386.82422, "r_y3": 102.15228000000013, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.69589, "r_y0": 114.01288000000011, "r_x1": 433.6032400000001, "r_y1": 114.01288000000011, "r_x2": 433.6032400000001, "r_y2": 108.27228000000002, "r_x3": 388.69589, "r_y3": 108.27228000000002, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.07761, "r_y0": 120.13286999999991, "r_x1": 431.22542999999996, "r_y1": 120.13286999999991, "r_x2": 431.22542999999996, "r_y2": 114.39227000000005, "r_x3": 391.07761, "r_y3": 114.39227000000005, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.22650000000004, "r_y0": 157.42571999999996, "r_x1": 498.82068, "r_y1": 157.42571999999996, "r_x2": 498.82068, "r_y2": 151.68511999999998, "r_x3": 431.22650000000004, "r_y3": 151.68511999999998, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.1738, "r_y0": 163.54578000000004, "r_x1": 498.87753000000004, "r_y1": 163.54578000000004, "r_x2": 498.87753000000004, "r_y2": 157.80517999999995, "r_x3": 431.1738, "r_y3": 157.80517999999995, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.5289, "r_y0": 169.66576999999995, "r_x1": 489.51827999999995, "r_y1": 169.66576999999995, "r_x2": 489.51827999999995, "r_y2": 163.92516999999998, "r_x3": 440.5289, "r_y3": 163.92516999999998, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37479, "r_y0": 183.99445000000003, "r_x1": 367.72333, "r_y1": 183.99445000000003, "r_x2": 367.72333, "r_y2": 178.25385000000006, "r_x3": 328.37479, "r_y3": 178.25385000000006, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 129.64948000000015, "r_x1": 373.67963, "r_y1": 129.64948000000015, "r_x2": 373.67963, "r_y2": 123.90886999999998, "r_x3": 331.84451, "r_y3": 123.90886999999998, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 134.74945000000002, "r_x1": 381.17786, "r_y1": 134.74945000000002, "r_x2": 381.17786, "r_y2": 129.00885000000017, "r_x3": 331.84451, "r_y3": 129.00885000000017, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.62633, "r_y0": 93.85681, "r_x1": 219.42332, "r_y1": 93.85681, "r_x2": 219.42332, "r_y2": 88.11621000000002, "r_x3": 196.62633, "r_y3": 88.11621000000002, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.66771, "r_y0": 135.23528999999996, "r_x1": 271.49899, "r_y1": 135.23528999999996, "r_x2": 271.49899, "r_y2": 129.4946900000001, "r_x3": 246.66771, "r_y3": 129.4946900000001, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 140.33533, "r_x1": 270.65021, "r_y1": 140.33533, "r_x2": 270.65021, "r_y2": 134.59473000000003, "r_x3": 247.51601, "r_y3": 134.59473000000003, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 94.75982999999997, "r_x1": 365.55347, "r_y1": 94.75982999999997, "r_x2": 365.55347, "r_y2": 89.01923, "r_x3": 330.63071, "r_y3": 89.01923, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 102.91985999999997, "r_x1": 370.22717, "r_y1": 102.91985999999997, "r_x2": 370.22717, "r_y2": 97.17926, "r_x3": 330.63071, "r_y3": 97.17926, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 111.07983000000002, "r_x1": 374.51157, "r_y1": 111.07983000000002, "r_x2": 374.51157, "r_y2": 105.33922999999993, "r_x3": 330.63071, "r_y3": 105.33922999999993, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 119.23987, "r_x1": 335.73233, "r_y1": 119.23987, "r_x2": 335.73233, "r_y2": 113.49926999999991, "r_x3": 330.63071, "r_y3": 113.49926999999991, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 146.57617000000005, "r_x1": 335.05988, "r_y1": 146.57617000000005, "r_x2": 335.05988, "r_y2": 141.79236000000003, "r_x3": 322.30579, "r_y3": 141.79236000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 153.71613000000002, "r_x1": 335.05988, "r_y1": 153.71613000000002, "r_x2": 335.05988, "r_y2": 148.93231000000003, "r_x3": 322.30579, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.54971, "r_y0": 154.29638999999997, "r_x1": 340.95242, "r_y1": 154.29638999999997, "r_x2": 340.95242, "r_y2": 148.55579, "r_x3": 337.54971, "r_y3": 148.55579, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56262, "r_y0": 153.71613000000002, "r_x1": 398.91446, "r_y1": 153.71613000000002, "r_x2": 398.91446, "r_y2": 148.93231000000003, "r_x3": 343.56262, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.41718, "r_y0": 153.71613000000002, "r_x1": 421.58801, "r_y1": 153.71613000000002, "r_x2": 421.58801, "r_y2": 148.93231000000003, "r_x3": 407.41718, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 160.85613999999998, "r_x1": 349.23022, "r_y1": 160.85613999999998, "r_x2": 349.23022, "r_y2": 156.07232999999997, "r_x3": 322.30579, "r_y3": 156.07232999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 167.99614999999994, "r_x1": 335.05988, "r_y1": 167.99614999999994, "r_x2": 335.05988, "r_y2": 163.21234000000004, "r_x3": 322.30579, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56155, "r_y0": 167.99614999999994, "r_x1": 374.73685, "r_y1": 167.99614999999994, "r_x2": 374.73685, "r_y2": 163.21234000000004, "r_x3": 343.56155, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 175.13617, "r_x1": 326.55716, "r_y1": 175.13617, "r_x2": 326.55716, "r_y2": 170.35235999999998, "r_x3": 322.30579, "r_y3": 170.35235999999998, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51111, "r_y0": 95.41027999999994, "r_x1": 326.91382, "r_y1": 95.41027999999994, "r_x2": 326.91382, "r_y2": 89.66967999999997, "r_x3": 323.51111, "r_y3": 89.66967999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 103.52948000000004, "r_x1": 327.1178, "r_y1": 103.52948000000004, "r_x2": 327.1178, "r_y2": 97.78887999999995, "r_x3": 323.71509, "r_y3": 97.78887999999995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 111.73029000000008, "r_x1": 327.1178, "r_y1": 111.73029000000008, "r_x2": 327.1178, "r_y2": 105.98969, "r_x3": 323.71509, "r_y3": 105.98969, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.4816, "r_y0": 154.28687000000002, "r_x1": 404.88431, "r_y1": 154.28687000000002, "r_x2": 404.88431, "r_y2": 148.54625999999996, "r_x3": 401.4816, "r_y3": 148.54625999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.6976, "r_y0": 168.42511000000002, "r_x1": 341.10031, "r_y1": 168.42511000000002, "r_x2": 341.10031, "r_y2": 162.68451000000005, "r_x3": 337.6976, "r_y3": 162.68451000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46378, "r_y0": 110.28644000000008, "r_x1": 457.86648999999994, "r_y1": 110.28644000000008, "r_x2": 457.86648999999994, "r_y2": 104.54584, "r_x3": 454.46378, "r_y3": 104.54584, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.32580999999993, "r_y0": 96.83605999999997, "r_x1": 496.72852, "r_y1": 96.83605999999997, "r_x2": 496.72852, "r_y2": 91.09546, "r_x3": 493.32580999999993, "r_y3": 91.09546, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08298, "r_y0": 96.30939000000001, "r_x1": 457.48569000000003, "r_y1": 96.30939000000001, "r_x2": 457.48569000000003, "r_y2": 90.56879000000015, "r_x3": 454.08298, "r_y3": 90.56879000000015, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 81.688072, "t": 122.43970000000002, "r": 84.927567, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 125.62891000000002, "r_x1": 84.927567, "r_y1": 125.62891000000002, "r_x2": 84.927567, "r_y2": 122.43970000000002, "r_x3": 81.688072, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 86.54731, "t": 122.43970000000002, "r": 93.026291, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 125.62891000000002, "r_x1": 93.026291, "r_y1": 125.62891000000002, "r_x2": 93.026291, "r_y2": 122.43970000000002, "r_x3": 86.54731, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 102.50498, "t": 115.25214000000005, "r": 115.3461, "b": 118.44135000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.50498, "r_y0": 118.44135000000006, "r_x1": 115.3461, "r_y1": 118.44135000000006, "r_x2": 115.3461, "r_y2": 115.25214000000005, "r_x3": 102.50498, "r_y3": 115.25214000000005, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 82.140205, "t": 115.21489999999994, "r": 93.291527, "b": 118.40410999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.140205, "r_y0": 118.40410999999995, "r_x1": 93.291527, "r_y1": 118.40410999999995, "r_x2": 93.291527, "r_y2": 115.21489999999994, "r_x3": 82.140205, "r_y3": 115.21489999999994, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 96.748268, "t": 122.43970000000002, "r": 104.3119, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 125.62891000000002, "r_x1": 104.3119, "r_y1": 125.62891000000002, "r_x2": 104.3119, "r_y2": 122.43970000000002, "r_x3": 96.748268, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 96.748268, "t": 127.74370999999985, "r": 102.42083, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 130.93291999999997, "r_x1": 102.42083, "r_y1": 130.93291999999997, "r_x2": 102.42083, "r_y2": 127.74370999999985, "r_x3": 96.748268, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 96.748268, "t": 133.45569, "r": 104.3119, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 136.6449, "r_x1": 104.3119, "r_y1": 136.6449, "r_x2": 104.3119, "r_y2": 133.45569, "r_x3": 96.748268, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 96.748268, "t": 139.16772000000003, "r": 102.42083, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.748268, "r_y0": 142.35693000000003, "r_x1": 102.42083, "r_y1": 142.35693000000003, "r_x2": 102.42083, "r_y2": 139.16772000000003, "r_x3": 96.748268, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 110.66107, "t": 122.43970000000002, "r": 116.14391, "b": 125.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 125.62891000000002, "r_x1": 116.14391, "r_y1": 125.62891000000002, "r_x2": 116.14391, "r_y2": 122.43970000000002, "r_x3": 110.66107, "r_y3": 122.43970000000002, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 110.66107, "t": 127.74370999999985, "r": 116.14391, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 130.93291999999997, "r_x1": 116.14391, "r_y1": 130.93291999999997, "r_x2": 116.14391, "r_y2": 127.74370999999985, "r_x3": 110.66107, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 110.66107, "t": 133.45569, "r": 116.14391, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 136.6449, "r_x1": 116.14391, "r_y1": 136.6449, "r_x2": 116.14391, "r_y2": 133.45569, "r_x3": 110.66107, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 110.66107, "t": 139.16772000000003, "r": 116.14391, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66107, "r_y0": 142.35693000000003, "r_x1": 116.14391, "r_y1": 142.35693000000003, "r_x2": 116.14391, "r_y2": 139.16772000000003, "r_x3": 110.66107, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 81.688072, "t": 127.74370999999985, "r": 84.927567, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 130.93291999999997, "r_x1": 84.927567, "r_y1": 130.93291999999997, "r_x2": 84.927567, "r_y2": 127.74370999999985, "r_x3": 81.688072, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 86.54731, "t": 127.74370999999985, "r": 93.026291, "b": 130.93291999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 130.93291999999997, "r_x1": 93.026291, "r_y1": 130.93291999999997, "r_x2": 93.026291, "r_y2": 127.74370999999985, "r_x3": 86.54731, "r_y3": 127.74370999999985, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 81.688072, "t": 133.45569, "r": 84.927567, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 136.6449, "r_x1": 84.927567, "r_y1": 136.6449, "r_x2": 84.927567, "r_y2": 133.45569, "r_x3": 81.688072, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 86.54731, "t": 133.45569, "r": 93.026291, "b": 136.6449, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 136.6449, "r_x1": 93.026291, "r_y1": 136.6449, "r_x2": 93.026291, "r_y2": 133.45569, "r_x3": 86.54731, "r_y3": 133.45569, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 81.688072, "t": 139.16772000000003, "r": 84.927567, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.688072, "r_y0": 142.35693000000003, "r_x1": 84.927567, "r_y1": 142.35693000000003, "r_x2": 84.927567, "r_y2": 139.16772000000003, "r_x3": 81.688072, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 86.54731, "t": 139.16772000000003, "r": 93.026291, "b": 142.35693000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.54731, "r_y0": 142.35693000000003, "r_x1": 93.026291, "r_y1": 142.35693000000003, "r_x2": 93.026291, "r_y2": 139.16772000000003, "r_x3": 86.54731, "r_y3": 139.16772000000003, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 88.084389, "t": 90.49738000000002, "r": 113.93649, "b": 96.23798, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.084389, "r_y0": 96.23798, "r_x1": 113.93649, "r_y1": 96.23798, "r_x2": 113.93649, "r_y2": 90.49738000000002, "r_x3": 88.084389, "r_y3": 90.49738000000002, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 82.81002, "t": 97.63738999999998, "r": 119.21240000000002, "b": 103.37798999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81002, "r_y0": 103.37798999999995, "r_x1": 119.21240000000002, "r_y1": 103.37798999999995, "r_x2": 119.21240000000002, "r_y2": 97.63738999999998, "r_x3": 82.81002, "r_y3": 97.63738999999998, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 143.94247, "t": 100.60235999999998, "r": 180.01131, "b": 106.34295999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94247, "r_y0": 106.34295999999995, "r_x1": 180.01131, "r_y1": 106.34295999999995, "r_x2": 180.01131, "r_y2": 100.60235999999998, "r_x3": 143.94247, "r_y3": 100.60235999999998, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 151.94064, "t": 107.74237000000005, "r": 172.0118, "b": 113.48297000000014, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94064, "r_y0": 113.48297000000014, "r_x1": 172.0118, "r_y1": 113.48297000000014, "r_x2": 172.0118, "r_y2": 107.74237000000005, "r_x3": 151.94064, "r_y3": 107.74237000000005, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 251.76939000000002, "t": 80.93096999999989, "r": 266.39557, "b": 86.67156999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.76939000000002, "r_y0": 86.67156999999997, "r_x1": 266.39557, "r_y1": 86.67156999999997, "r_x2": 266.39557, "r_y2": 80.93096999999989, "r_x3": 251.76939000000002, "r_y3": 80.93096999999989, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 247.51601, "t": 86.03101000000004, "r": 270.65021, "b": 91.77161000000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 91.77161000000001, "r_x1": 270.65021, "r_y1": 91.77161000000001, "r_x2": 270.65021, "r_y2": 86.03101000000004, "r_x3": 247.51601, "r_y3": 86.03101000000004, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 331.03699, "t": 78.55980999999997, "r": 352.12589, "b": 84.30042000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.03699, "r_y0": 84.30042000000003, "r_x1": 352.12589, "r_y1": 84.30042000000003, "r_x2": 352.12589, "r_y2": 78.55980999999997, "r_x3": 331.03699, "r_y3": 78.55980999999997, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 390.56421, "t": 96.03223000000003, "r": 431.7261, "b": 101.77282999999989, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56421, "r_y0": 101.77282999999989, "r_x1": 431.7261, "r_y1": 101.77282999999989, "r_x2": 431.7261, "r_y2": 96.03223000000003, "r_x3": 390.56421, "r_y3": 96.03223000000003, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 386.82422, "t": 102.15228000000013, "r": 435.46966999999995, "b": 107.89287999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82422, "r_y0": 107.89287999999999, "r_x1": 435.46966999999995, "r_y1": 107.89287999999999, "r_x2": 435.46966999999995, "r_y2": 102.15228000000013, "r_x3": 386.82422, "r_y3": 102.15228000000013, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 388.69589, "t": 108.27228000000002, "r": 433.6032400000001, "b": 114.01288000000011, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.69589, "r_y0": 114.01288000000011, "r_x1": 433.6032400000001, "r_y1": 114.01288000000011, "r_x2": 433.6032400000001, "r_y2": 108.27228000000002, "r_x3": 388.69589, "r_y3": 108.27228000000002, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 391.07761, "t": 114.39227000000005, "r": 431.22542999999996, "b": 120.13286999999991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.07761, "r_y0": 120.13286999999991, "r_x1": 431.22542999999996, "r_y1": 120.13286999999991, "r_x2": 431.22542999999996, "r_y2": 114.39227000000005, "r_x3": 391.07761, "r_y3": 114.39227000000005, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 431.22650000000004, "t": 151.68511999999998, "r": 498.82068, "b": 157.42571999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.22650000000004, "r_y0": 157.42571999999996, "r_x1": 498.82068, "r_y1": 157.42571999999996, "r_x2": 498.82068, "r_y2": 151.68511999999998, "r_x3": 431.22650000000004, "r_y3": 151.68511999999998, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 431.1738, "t": 157.80517999999995, "r": 498.87753000000004, "b": 163.54578000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.1738, "r_y0": 163.54578000000004, "r_x1": 498.87753000000004, "r_y1": 163.54578000000004, "r_x2": 498.87753000000004, "r_y2": 157.80517999999995, "r_x3": 431.1738, "r_y3": 157.80517999999995, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 440.5289, "t": 163.92516999999998, "r": 489.51827999999995, "b": 169.66576999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.5289, "r_y0": 169.66576999999995, "r_x1": 489.51827999999995, "r_y1": 169.66576999999995, "r_x2": 489.51827999999995, "r_y2": 163.92516999999998, "r_x3": 440.5289, "r_y3": 163.92516999999998, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 328.37479, "t": 178.25385000000006, "r": 367.72333, "b": 183.99445000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37479, "r_y0": 183.99445000000003, "r_x1": 367.72333, "r_y1": 183.99445000000003, "r_x2": 367.72333, "r_y2": 178.25385000000006, "r_x3": 328.37479, "r_y3": 178.25385000000006, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 331.84451, "t": 123.90886999999998, "r": 373.67963, "b": 129.64948000000015, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 129.64948000000015, "r_x1": 373.67963, "r_y1": 129.64948000000015, "r_x2": 373.67963, "r_y2": 123.90886999999998, "r_x3": 331.84451, "r_y3": 123.90886999999998, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 331.84451, "t": 129.00885000000017, "r": 381.17786, "b": 134.74945000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84451, "r_y0": 134.74945000000002, "r_x1": 381.17786, "r_y1": 134.74945000000002, "r_x2": 381.17786, "r_y2": 129.00885000000017, "r_x3": 331.84451, "r_y3": 129.00885000000017, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 196.62633, "t": 88.11621000000002, "r": 219.42332, "b": 93.85681, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.62633, "r_y0": 93.85681, "r_x1": 219.42332, "r_y1": 93.85681, "r_x2": 219.42332, "r_y2": 88.11621000000002, "r_x3": 196.62633, "r_y3": 88.11621000000002, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 246.66771, "t": 129.4946900000001, "r": 271.49899, "b": 135.23528999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.66771, "r_y0": 135.23528999999996, "r_x1": 271.49899, "r_y1": 135.23528999999996, "r_x2": 271.49899, "r_y2": 129.4946900000001, "r_x3": 246.66771, "r_y3": 129.4946900000001, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 247.51601, "t": 134.59473000000003, "r": 270.65021, "b": 140.33533, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.51601, "r_y0": 140.33533, "r_x1": 270.65021, "r_y1": 140.33533, "r_x2": 270.65021, "r_y2": 134.59473000000003, "r_x3": 247.51601, "r_y3": 134.59473000000003, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 330.63071, "t": 89.01923, "r": 365.55347, "b": 94.75982999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 94.75982999999997, "r_x1": 365.55347, "r_y1": 94.75982999999997, "r_x2": 365.55347, "r_y2": 89.01923, "r_x3": 330.63071, "r_y3": 89.01923, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 330.63071, "t": 97.17926, "r": 370.22717, "b": 102.91985999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 102.91985999999997, "r_x1": 370.22717, "r_y1": 102.91985999999997, "r_x2": 370.22717, "r_y2": 97.17926, "r_x3": 330.63071, "r_y3": 97.17926, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 330.63071, "t": 105.33922999999993, "r": 374.51157, "b": 111.07983000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 111.07983000000002, "r_x1": 374.51157, "r_y1": 111.07983000000002, "r_x2": 374.51157, "r_y2": 105.33922999999993, "r_x3": 330.63071, "r_y3": 105.33922999999993, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 330.63071, "t": 113.49926999999991, "r": 335.73233, "b": 119.23987, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63071, "r_y0": 119.23987, "r_x1": 335.73233, "r_y1": 119.23987, "r_x2": 335.73233, "r_y2": 113.49926999999991, "r_x3": 330.63071, "r_y3": 113.49926999999991, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 322.30579, "t": 141.79236000000003, "r": 335.05988, "b": 146.57617000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 146.57617000000005, "r_x1": 335.05988, "r_y1": 146.57617000000005, "r_x2": 335.05988, "r_y2": 141.79236000000003, "r_x3": 322.30579, "r_y3": 141.79236000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 322.30579, "t": 148.93231000000003, "r": 335.05988, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 153.71613000000002, "r_x1": 335.05988, "r_y1": 153.71613000000002, "r_x2": 335.05988, "r_y2": 148.93231000000003, "r_x3": 322.30579, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 337.54971, "t": 148.55579, "r": 340.95242, "b": 154.29638999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.54971, "r_y0": 154.29638999999997, "r_x1": 340.95242, "r_y1": 154.29638999999997, "r_x2": 340.95242, "r_y2": 148.55579, "r_x3": 337.54971, "r_y3": 148.55579, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 343.56262, "t": 148.93231000000003, "r": 398.91446, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56262, "r_y0": 153.71613000000002, "r_x1": 398.91446, "r_y1": 153.71613000000002, "r_x2": 398.91446, "r_y2": 148.93231000000003, "r_x3": 343.56262, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 407.41718, "t": 148.93231000000003, "r": 421.58801, "b": 153.71613000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.41718, "r_y0": 153.71613000000002, "r_x1": 421.58801, "r_y1": 153.71613000000002, "r_x2": 421.58801, "r_y2": 148.93231000000003, "r_x3": 407.41718, "r_y3": 148.93231000000003, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 322.30579, "t": 156.07232999999997, "r": 349.23022, "b": 160.85613999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 160.85613999999998, "r_x1": 349.23022, "r_y1": 160.85613999999998, "r_x2": 349.23022, "r_y2": 156.07232999999997, "r_x3": 322.30579, "r_y3": 156.07232999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 322.30579, "t": 163.21234000000004, "r": 335.05988, "b": 167.99614999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 167.99614999999994, "r_x1": 335.05988, "r_y1": 167.99614999999994, "r_x2": 335.05988, "r_y2": 163.21234000000004, "r_x3": 322.30579, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 343.56155, "t": 163.21234000000004, "r": 374.73685, "b": 167.99614999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56155, "r_y0": 167.99614999999994, "r_x1": 374.73685, "r_y1": 167.99614999999994, "r_x2": 374.73685, "r_y2": 163.21234000000004, "r_x3": 343.56155, "r_y3": 163.21234000000004, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 322.30579, "t": 170.35235999999998, "r": 326.55716, "b": 175.13617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.30579, "r_y0": 175.13617, "r_x1": 326.55716, "r_y1": 175.13617, "r_x2": 326.55716, "r_y2": 170.35235999999998, "r_x3": 322.30579, "r_y3": 170.35235999999998, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 323.51111, "t": 89.66967999999997, "r": 326.91382, "b": 95.41027999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51111, "r_y0": 95.41027999999994, "r_x1": 326.91382, "r_y1": 95.41027999999994, "r_x2": 326.91382, "r_y2": 89.66967999999997, "r_x3": 323.51111, "r_y3": 89.66967999999997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 323.71509, "t": 97.78887999999995, "r": 327.1178, "b": 103.52948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 103.52948000000004, "r_x1": 327.1178, "r_y1": 103.52948000000004, "r_x2": 327.1178, "r_y2": 97.78887999999995, "r_x3": 323.71509, "r_y3": 97.78887999999995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 323.71509, "t": 105.98969, "r": 327.1178, "b": 111.73029000000008, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.71509, "r_y0": 111.73029000000008, "r_x1": 327.1178, "r_y1": 111.73029000000008, "r_x2": 327.1178, "r_y2": 105.98969, "r_x3": 323.71509, "r_y3": 105.98969, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 401.4816, "t": 148.54625999999996, "r": 404.88431, "b": 154.28687000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.4816, "r_y0": 154.28687000000002, "r_x1": 404.88431, "r_y1": 154.28687000000002, "r_x2": 404.88431, "r_y2": 148.54625999999996, "r_x3": 401.4816, "r_y3": 148.54625999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 337.6976, "t": 162.68451000000005, "r": 341.10031, "b": 168.42511000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.6976, "r_y0": 168.42511000000002, "r_x1": 341.10031, "r_y1": 168.42511000000002, "r_x2": 341.10031, "r_y2": 162.68451000000005, "r_x3": 337.6976, "r_y3": 162.68451000000005, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 454.46378, "t": 104.54584, "r": 457.86648999999994, "b": 110.28644000000008, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46378, "r_y0": 110.28644000000008, "r_x1": 457.86648999999994, "r_y1": 110.28644000000008, "r_x2": 457.86648999999994, "r_y2": 104.54584, "r_x3": 454.46378, "r_y3": 104.54584, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 493.32580999999993, "t": 91.09546, "r": 496.72852, "b": 96.83605999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.32580999999993, "r_y0": 96.83605999999997, "r_x1": 496.72852, "r_y1": 96.83605999999997, "r_x2": 496.72852, "r_y2": 91.09546, "r_x3": 493.32580999999993, "r_y3": 91.09546, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 454.08298, "t": 90.56879000000015, "r": 457.48569000000003, "b": 96.30939000000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08298, "r_y0": 96.30939000000001, "r_x1": 457.48569000000003, "r_y1": 96.30939000000001, "r_x2": 457.48569000000003, "r_y2": 90.56879000000015, "r_x3": 454.08298, "r_y3": 90.56879000000015, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.111992, "t": 203.98577999999998, "r": 545.10846, "b": 224.96691999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9677652716636658, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 213.01189999999997, "r_x1": 86.883949, "r_y1": 213.01189999999997, "r_x2": 86.883949, "r_y2": 204.10535000000004, "r_x3": 50.112, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.020996, "r_y0": 212.94214, "r_x1": 149.85141, "r_y1": 212.94214, "r_x2": 149.85141, "r_y2": 203.98577999999998, "r_x3": 94.020996, "r_y3": 203.98577999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86099, "r_y0": 213.01189999999997, "r_x1": 545.10846, "r_y1": 213.01189999999997, "r_x2": 545.10846, "r_y2": 204.10535000000004, "r_x3": 152.86099, "r_y3": 204.10535000000004, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 224.96691999999996, "r_x1": 436.0134, "r_y1": 224.96691999999996, "r_x2": 436.0134, "r_y2": 216.06035999999995, "r_x3": 50.111992, "r_y3": 216.06035999999995, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure." }, { "label": "picture", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT" }, "confidence": 0.9724942445755005, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.253464, "r_y0": 264.17474000000004, "r_x1": 101.75846, "r_y1": 264.17474000000004, "r_x2": 101.75846, "r_y2": 258.21472000000006, "r_x3": 74.253464, "r_y3": 258.21472000000006, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.29972, "r_y0": 264.30524, "r_x1": 157.83972, "r_y1": 264.30524, "r_x2": 157.83972, "r_y2": 258.34520999999995, "r_x3": 122.29972, "r_y3": 258.34520999999995, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.549347, "r_y0": 377.04782, "r_x1": 125.68359000000001, "r_y1": 377.04782, "r_x2": 125.68359000000001, "r_y2": 371.38579999999996, "r_x3": 78.549347, "r_y3": 371.38579999999996, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.513298, "r_y0": 396.98059, "r_x1": 84.644547, "r_y1": 396.98059, "r_x2": 84.644547, "r_y2": 391.31857, "r_x3": 78.513298, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.52705, "r_y0": 396.98059, "r_x1": 125.11079999999998, "r_y1": 396.98059, "r_x2": 125.11079999999998, "r_y2": 391.31857, "r_x3": 116.52705, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.024773, "r_y0": 430.11511, "r_x1": 127.92327000000002, "r_y1": 430.11511, "r_x2": 127.92327000000002, "r_y2": 424.45309, "r_x3": 76.024773, "r_y3": 424.45309, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.382828, "r_y0": 450.55157, "r_x1": 84.514076, "r_y1": 450.55157, "r_x2": 84.514076, "r_y2": 444.88956, "r_x3": 78.382828, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.39658, "r_y0": 450.55157, "r_x1": 124.98033, "r_y1": 450.55157, "r_x2": 124.98033, "r_y2": 444.88956, "r_x3": 116.39658, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.46945, "r_y0": 468.10526, "r_x1": 181.6292, "r_y1": 468.10526, "r_x2": 181.6292, "r_y2": 462.44324, "r_x3": 167.46945, "r_y3": 462.44324, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61292, "r_y0": 484.13309, "r_x1": 184.43242, "r_y1": 484.13309, "r_x2": 184.43242, "r_y2": 478.47107, "r_x3": 165.61292, "r_y3": 478.47107, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.319511, "r_y0": 330.22235000000006, "r_x1": 132.9245, "r_y1": 330.22235000000006, "r_x2": 132.9245, "r_y2": 324.26235999999994, "r_x3": 65.319511, "r_y3": 324.26235999999994, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51457, "r_y0": 274.72992, "r_x1": 162.98782, "r_y1": 274.72992, "r_x2": 162.98782, "r_y2": 269.66394, "r_x3": 119.51457, "r_y3": 269.66394, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.72858, "r_y0": 279.97992, "r_x1": 151.41083, "r_y1": 279.97992, "r_x2": 151.41083, "r_y2": 274.91394, "r_x3": 128.72858, "r_y3": 274.91394, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.434211999999995, "r_y0": 344.26993, "r_x1": 80.27021, "r_y1": 344.26993, "r_x2": 80.27021, "r_y2": 338.95993, "r_x3": 60.434211999999995, "r_y3": 338.95993, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.598457, "r_y0": 348.69604, "r_x1": 78.854958, "r_y1": 348.69604, "r_x2": 78.854958, "r_y2": 343.38605, "r_x3": 60.598457, "r_y3": 343.38605, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.82877, "r_y0": 298.68762, "r_x1": 154.66476, "r_y1": 298.68762, "r_x2": 154.66476, "r_y2": 293.37762, "r_x3": 134.82877, "r_y3": 293.37762, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99303, "r_y0": 303.11371, "r_x1": 153.24953, "r_y1": 303.11371, "r_x2": 153.24953, "r_y2": 297.80370999999997, "r_x3": 134.99303, "r_y3": 297.80370999999997, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 351.02063, "r_x1": 197.14943, "r_y1": 351.02063, "r_x2": 197.14943, "r_y2": 345.35861, "r_x3": 150.55193, "r_y3": 345.35861, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 400.08542, "r_x1": 156.68318, "r_y1": 400.08542, "r_x2": 156.68318, "r_y2": 394.4234, "r_x3": 150.55193, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 400.08542, "r_x1": 197.14943, "r_y1": 400.08542, "r_x2": 197.14943, "r_y2": 394.4234, "r_x3": 188.56567, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.18539, "r_y0": 381.33044, "r_x1": 197.31964, "r_y1": 381.33044, "r_x2": 197.31964, "r_y2": 375.66843, "r_x3": 150.18539, "r_y3": 375.66843, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 445.91049, "r_x1": 156.68318, "r_y1": 445.91049, "r_x2": 156.68318, "r_y2": 440.24847000000005, "r_x3": 150.55193, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 445.91049, "r_x1": 197.14943, "r_y1": 445.91049, "r_x2": 197.14943, "r_y2": 440.24847000000005, "r_x3": 188.56567, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86377, "r_y0": 427.75537, "r_x1": 199.76227, "r_y1": 427.75537, "r_x2": 199.76227, "r_y2": 422.09335, "r_x3": 147.86377, "r_y3": 422.09335, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.56567000000004, "r_y0": 319.92487, "r_x1": 255.72542, "r_y1": 319.92487, "r_x2": 255.72542, "r_y2": 314.26285000000007, "r_x3": 241.56567000000004, "r_y3": 314.26285000000007, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.91730000000004, "r_y0": 367.02695, "r_x1": 256.07706, "r_y1": 367.02695, "r_x2": 256.07706, "r_y2": 361.36493, "r_x3": 241.91730000000004, "r_y3": 361.36493, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.054, "r_y0": 342.28131, "r_x1": 248.72363000000004, "r_y1": 342.28131, "r_x2": 248.72363000000004, "r_y2": 336.61929000000003, "r_x3": 228.054, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.2919, "r_y0": 342.28131, "r_x1": 269.39325, "r_y1": 342.28131, "r_x2": 269.39325, "r_y2": 336.61929000000003, "r_x3": 246.2919, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.44568000000004, "r_y0": 410.80884, "r_x1": 238.73892, "r_y1": 410.80884, "r_x2": 238.73892, "r_y2": 405.14682, "r_x3": 228.44568000000004, "r_y3": 405.14682, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.29767, "r_y0": 410.86526, "r_x1": 271.77792, "r_y1": 410.86526, "r_x2": 271.77792, "r_y2": 405.2032500000001, "r_x3": 256.29767, "r_y3": 405.2032500000001, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.54543, "r_y0": 387.87546, "r_x1": 258.08942, "r_y1": 387.87546, "r_x2": 258.08942, "r_y2": 382.21344, "r_x3": 239.54543, "r_y3": 382.21344, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.14704100000001, "r_y0": 449.78326, "r_x1": 59.51152, "r_y1": 449.78326, "r_x2": 59.51152, "r_y2": 384.87183, "r_x3": 54.14704100000001, "r_y3": 384.87183, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.235424, "r_y0": 378.45421999999996, "r_x1": 59.30449699999999, "r_y1": 378.45421999999996, "r_x2": 59.30449699999999, "r_y2": 373.81232, "r_x3": 54.235424, "r_y3": 373.81232, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.295891, "r_y0": 490.36688, "r_x1": 122.16431, "r_y1": 490.36688, "r_x2": 122.16431, "r_y2": 484.53189, "r_x3": 85.295891, "r_y3": 484.53189, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.66599, "r_y0": 285.45572000000004, "r_x1": 265.3194, "r_y1": 285.45572000000004, "r_x2": 265.3194, "r_y2": 279.54607999999996, "r_x3": 229.66599, "r_y3": 279.54607999999996, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17369, "r_y0": 506.12943, "r_x1": 190.41711, "r_y1": 506.12943, "r_x2": 190.41711, "r_y2": 500.3031, "r_x3": 157.17369, "r_y3": 500.3031, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.81598999999997, "r_y0": 443.89206, "r_x1": 270.78442, "r_y1": 443.89206, "r_x2": 270.78442, "r_y2": 438.05542, "r_x3": 227.81598999999997, "r_y3": 438.05542, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.70262, "r_y0": 449.8904999999999, "r_x1": 263.51105, "r_y1": 449.8904999999999, "r_x2": 263.51105, "r_y2": 444.06183, "r_x3": 233.70262, "r_y3": 444.06183, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.74655, "r_y0": 298.75903, "r_x1": 212.16055, "r_y1": 298.75903, "r_x2": 212.16055, "r_y2": 293.39502, "r_x3": 184.74655, "r_y3": 293.39502, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91229, "r_y0": 304.50903, "r_x1": 216.74378999999996, "r_y1": 304.50903, "r_x2": 216.74378999999996, "r_y2": 299.14502, "r_x3": 178.91229, "r_y3": 299.14502, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.24574, "r_y0": 287.84817999999996, "r_x1": 198.89099, "r_y1": 287.84817999999996, "r_x2": 198.89099, "r_y2": 282.7822, "r_x3": 194.24574, "r_y3": 282.7822, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.45587, "r_y0": 277.82916, "r_x1": 276.47089, "r_y1": 277.82916, "r_x2": 276.47089, "r_y2": 271.86914, "r_x3": 221.45587, "r_y3": 271.86914, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65219, "r_y0": 329.10443, "r_x1": 197.29019, "r_y1": 329.10443, "r_x2": 197.29019, "r_y2": 323.44241, "r_x3": 151.65219, "r_y3": 323.44241, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43277, "r_y0": 335.10443, "r_x1": 184.19028, "r_y1": 335.10443, "r_x2": 184.19028, "r_y2": 329.44241, "r_x3": 163.43277, "r_y3": 329.44241, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 70, "label": "text", "bbox": { "l": 74.253464, "t": 258.21472000000006, "r": 101.75846, "b": 264.17474000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.253464, "r_y0": 264.17474000000004, "r_x1": 101.75846, "r_y1": 264.17474000000004, "r_x2": 101.75846, "r_y2": 258.21472000000006, "r_x3": 74.253464, "r_y3": 258.21472000000006, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 122.29972, "t": 258.34520999999995, "r": 157.83972, "b": 264.30524, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.29972, "r_y0": 264.30524, "r_x1": 157.83972, "r_y1": 264.30524, "r_x2": 157.83972, "r_y2": 258.34520999999995, "r_x3": 122.29972, "r_y3": 258.34520999999995, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 78.549347, "t": 371.38579999999996, "r": 125.68359000000001, "b": 377.04782, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.549347, "r_y0": 377.04782, "r_x1": 125.68359000000001, "r_y1": 377.04782, "r_x2": 125.68359000000001, "r_y2": 371.38579999999996, "r_x3": 78.549347, "r_y3": 371.38579999999996, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 78.513298, "t": 391.31857, "r": 84.644547, "b": 396.98059, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.513298, "r_y0": 396.98059, "r_x1": 84.644547, "r_y1": 396.98059, "r_x2": 84.644547, "r_y2": 391.31857, "r_x3": 78.513298, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 116.52705, "t": 391.31857, "r": 125.11079999999998, "b": 396.98059, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.52705, "r_y0": 396.98059, "r_x1": 125.11079999999998, "r_y1": 396.98059, "r_x2": 125.11079999999998, "r_y2": 391.31857, "r_x3": 116.52705, "r_y3": 391.31857, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 76.024773, "t": 424.45309, "r": 127.92327000000002, "b": 430.11511, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.024773, "r_y0": 430.11511, "r_x1": 127.92327000000002, "r_y1": 430.11511, "r_x2": 127.92327000000002, "r_y2": 424.45309, "r_x3": 76.024773, "r_y3": 424.45309, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 78.382828, "t": 444.88956, "r": 84.514076, "b": 450.55157, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.382828, "r_y0": 450.55157, "r_x1": 84.514076, "r_y1": 450.55157, "r_x2": 84.514076, "r_y2": 444.88956, "r_x3": 78.382828, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 116.39658, "t": 444.88956, "r": 124.98033, "b": 450.55157, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.39658, "r_y0": 450.55157, "r_x1": 124.98033, "r_y1": 450.55157, "r_x2": 124.98033, "r_y2": 444.88956, "r_x3": 116.39658, "r_y3": 444.88956, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 167.46945, "t": 462.44324, "r": 181.6292, "b": 468.10526, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.46945, "r_y0": 468.10526, "r_x1": 181.6292, "r_y1": 468.10526, "r_x2": 181.6292, "r_y2": 462.44324, "r_x3": 167.46945, "r_y3": 462.44324, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 165.61292, "t": 478.47107, "r": 184.43242, "b": 484.13309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61292, "r_y0": 484.13309, "r_x1": 184.43242, "r_y1": 484.13309, "r_x2": 184.43242, "r_y2": 478.47107, "r_x3": 165.61292, "r_y3": 478.47107, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 65.319511, "t": 324.26235999999994, "r": 132.9245, "b": 330.22235000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.319511, "r_y0": 330.22235000000006, "r_x1": 132.9245, "r_y1": 330.22235000000006, "r_x2": 132.9245, "r_y2": 324.26235999999994, "r_x3": 65.319511, "r_y3": 324.26235999999994, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 119.51457, "t": 269.66394, "r": 162.98782, "b": 274.72992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51457, "r_y0": 274.72992, "r_x1": 162.98782, "r_y1": 274.72992, "r_x2": 162.98782, "r_y2": 269.66394, "r_x3": 119.51457, "r_y3": 269.66394, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 128.72858, "t": 274.91394, "r": 151.41083, "b": 279.97992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.72858, "r_y0": 279.97992, "r_x1": 151.41083, "r_y1": 279.97992, "r_x2": 151.41083, "r_y2": 274.91394, "r_x3": 128.72858, "r_y3": 274.91394, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 60.434211999999995, "t": 338.95993, "r": 80.27021, "b": 344.26993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.434211999999995, "r_y0": 344.26993, "r_x1": 80.27021, "r_y1": 344.26993, "r_x2": 80.27021, "r_y2": 338.95993, "r_x3": 60.434211999999995, "r_y3": 338.95993, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 60.598457, "t": 343.38605, "r": 78.854958, "b": 348.69604, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.598457, "r_y0": 348.69604, "r_x1": 78.854958, "r_y1": 348.69604, "r_x2": 78.854958, "r_y2": 343.38605, "r_x3": 60.598457, "r_y3": 343.38605, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 134.82877, "t": 293.37762, "r": 154.66476, "b": 298.68762, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.82877, "r_y0": 298.68762, "r_x1": 154.66476, "r_y1": 298.68762, "r_x2": 154.66476, "r_y2": 293.37762, "r_x3": 134.82877, "r_y3": 293.37762, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 134.99303, "t": 297.80370999999997, "r": 153.24953, "b": 303.11371, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99303, "r_y0": 303.11371, "r_x1": 153.24953, "r_y1": 303.11371, "r_x2": 153.24953, "r_y2": 297.80370999999997, "r_x3": 134.99303, "r_y3": 297.80370999999997, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 150.55193, "t": 345.35861, "r": 197.14943, "b": 351.02063, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 351.02063, "r_x1": 197.14943, "r_y1": 351.02063, "r_x2": 197.14943, "r_y2": 345.35861, "r_x3": 150.55193, "r_y3": 345.35861, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 150.55193, "t": 394.4234, "r": 156.68318, "b": 400.08542, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 400.08542, "r_x1": 156.68318, "r_y1": 400.08542, "r_x2": 156.68318, "r_y2": 394.4234, "r_x3": 150.55193, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 188.56567, "t": 394.4234, "r": 197.14943, "b": 400.08542, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 400.08542, "r_x1": 197.14943, "r_y1": 400.08542, "r_x2": 197.14943, "r_y2": 394.4234, "r_x3": 188.56567, "r_y3": 394.4234, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 150.18539, "t": 375.66843, "r": 197.31964, "b": 381.33044, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.18539, "r_y0": 381.33044, "r_x1": 197.31964, "r_y1": 381.33044, "r_x2": 197.31964, "r_y2": 375.66843, "r_x3": 150.18539, "r_y3": 375.66843, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 150.55193, "t": 440.24847000000005, "r": 156.68318, "b": 445.91049, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55193, "r_y0": 445.91049, "r_x1": 156.68318, "r_y1": 445.91049, "r_x2": 156.68318, "r_y2": 440.24847000000005, "r_x3": 150.55193, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 188.56567, "t": 440.24847000000005, "r": 197.14943, "b": 445.91049, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.56567, "r_y0": 445.91049, "r_x1": 197.14943, "r_y1": 445.91049, "r_x2": 197.14943, "r_y2": 440.24847000000005, "r_x3": 188.56567, "r_y3": 440.24847000000005, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 147.86377, "t": 422.09335, "r": 199.76227, "b": 427.75537, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86377, "r_y0": 427.75537, "r_x1": 199.76227, "r_y1": 427.75537, "r_x2": 199.76227, "r_y2": 422.09335, "r_x3": 147.86377, "r_y3": 422.09335, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 241.56567000000004, "t": 314.26285000000007, "r": 255.72542, "b": 319.92487, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.56567000000004, "r_y0": 319.92487, "r_x1": 255.72542, "r_y1": 319.92487, "r_x2": 255.72542, "r_y2": 314.26285000000007, "r_x3": 241.56567000000004, "r_y3": 314.26285000000007, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 241.91730000000004, "t": 361.36493, "r": 256.07706, "b": 367.02695, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.91730000000004, "r_y0": 367.02695, "r_x1": 256.07706, "r_y1": 367.02695, "r_x2": 256.07706, "r_y2": 361.36493, "r_x3": 241.91730000000004, "r_y3": 361.36493, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 228.054, "t": 336.61929000000003, "r": 248.72363000000004, "b": 342.28131, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.054, "r_y0": 342.28131, "r_x1": 248.72363000000004, "r_y1": 342.28131, "r_x2": 248.72363000000004, "r_y2": 336.61929000000003, "r_x3": 228.054, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 246.2919, "t": 336.61929000000003, "r": 269.39325, "b": 342.28131, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.2919, "r_y0": 342.28131, "r_x1": 269.39325, "r_y1": 342.28131, "r_x2": 269.39325, "r_y2": 336.61929000000003, "r_x3": 246.2919, "r_y3": 336.61929000000003, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 228.44568000000004, "t": 405.14682, "r": 238.73892, "b": 410.80884, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.44568000000004, "r_y0": 410.80884, "r_x1": 238.73892, "r_y1": 410.80884, "r_x2": 238.73892, "r_y2": 405.14682, "r_x3": 228.44568000000004, "r_y3": 405.14682, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 256.29767, "t": 405.2032500000001, "r": 271.77792, "b": 410.86526, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.29767, "r_y0": 410.86526, "r_x1": 271.77792, "r_y1": 410.86526, "r_x2": 271.77792, "r_y2": 405.2032500000001, "r_x3": 256.29767, "r_y3": 405.2032500000001, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 239.54543, "t": 382.21344, "r": 258.08942, "b": 387.87546, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.54543, "r_y0": 387.87546, "r_x1": 258.08942, "r_y1": 387.87546, "r_x2": 258.08942, "r_y2": 382.21344, "r_x3": 239.54543, "r_y3": 382.21344, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 54.14704100000001, "t": 384.87183, "r": 59.51152, "b": 449.78326, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.14704100000001, "r_y0": 449.78326, "r_x1": 59.51152, "r_y1": 449.78326, "r_x2": 59.51152, "r_y2": 384.87183, "r_x3": 54.14704100000001, "r_y3": 384.87183, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 54.235424, "t": 373.81232, "r": 59.30449699999999, "b": 378.45421999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.235424, "r_y0": 378.45421999999996, "r_x1": 59.30449699999999, "r_y1": 378.45421999999996, "r_x2": 59.30449699999999, "r_y2": 373.81232, "r_x3": 54.235424, "r_y3": 373.81232, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 85.295891, "t": 484.53189, "r": 122.16431, "b": 490.36688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.295891, "r_y0": 490.36688, "r_x1": 122.16431, "r_y1": 490.36688, "r_x2": 122.16431, "r_y2": 484.53189, "r_x3": 85.295891, "r_y3": 484.53189, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 229.66599, "t": 279.54607999999996, "r": 265.3194, "b": 285.45572000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.66599, "r_y0": 285.45572000000004, "r_x1": 265.3194, "r_y1": 285.45572000000004, "r_x2": 265.3194, "r_y2": 279.54607999999996, "r_x3": 229.66599, "r_y3": 279.54607999999996, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 157.17369, "t": 500.3031, "r": 190.41711, "b": 506.12943, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17369, "r_y0": 506.12943, "r_x1": 190.41711, "r_y1": 506.12943, "r_x2": 190.41711, "r_y2": 500.3031, "r_x3": 157.17369, "r_y3": 500.3031, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 227.81598999999997, "t": 438.05542, "r": 270.78442, "b": 443.89206, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.81598999999997, "r_y0": 443.89206, "r_x1": 270.78442, "r_y1": 443.89206, "r_x2": 270.78442, "r_y2": 438.05542, "r_x3": 227.81598999999997, "r_y3": 438.05542, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 233.70262, "t": 444.06183, "r": 263.51105, "b": 449.8904999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.70262, "r_y0": 449.8904999999999, "r_x1": 263.51105, "r_y1": 449.8904999999999, "r_x2": 263.51105, "r_y2": 444.06183, "r_x3": 233.70262, "r_y3": 444.06183, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 184.74655, "t": 293.39502, "r": 212.16055, "b": 298.75903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.74655, "r_y0": 298.75903, "r_x1": 212.16055, "r_y1": 298.75903, "r_x2": 212.16055, "r_y2": 293.39502, "r_x3": 184.74655, "r_y3": 293.39502, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 178.91229, "t": 299.14502, "r": 216.74378999999996, "b": 304.50903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91229, "r_y0": 304.50903, "r_x1": 216.74378999999996, "r_y1": 304.50903, "r_x2": 216.74378999999996, "r_y2": 299.14502, "r_x3": 178.91229, "r_y3": 299.14502, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 194.24574, "t": 282.7822, "r": 198.89099, "b": 287.84817999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.24574, "r_y0": 287.84817999999996, "r_x1": 198.89099, "r_y1": 287.84817999999996, "r_x2": 198.89099, "r_y2": 282.7822, "r_x3": 194.24574, "r_y3": 282.7822, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 221.45587, "t": 271.86914, "r": 276.47089, "b": 277.82916, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.45587, "r_y0": 277.82916, "r_x1": 276.47089, "r_y1": 277.82916, "r_x2": 276.47089, "r_y2": 271.86914, "r_x3": 221.45587, "r_y3": 271.86914, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 151.65219, "t": 323.44241, "r": 197.29019, "b": 329.10443, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65219, "r_y0": 329.10443, "r_x1": 197.29019, "r_y1": 329.10443, "r_x2": 197.29019, "r_y2": 323.44241, "r_x3": 151.65219, "r_y3": 323.44241, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 163.43277, "t": 329.44241, "r": 184.19028, "b": 335.10443, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43277, "r_y0": 335.10443, "r_x1": 184.19028, "r_y1": 335.10443, "r_x2": 184.19028, "r_y2": 329.44241, "r_x3": 163.43277, "r_y3": 329.44241, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 8, "page_no": 4, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 50.112, "t": 527.7828099999999, "r": 286.36597, "b": 680.27094, "coord_origin": "TOPLEFT" }, "confidence": 0.8913407325744629, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 536.80893, "r_x1": 229.78752, "r_y1": 536.80893, "r_x2": 229.78752, "r_y2": 527.90237, "r_x3": 50.112, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.787, "r_y0": 536.7392, "r_x1": 267.76196, "r_y1": 536.7392, "r_x2": 267.76196, "r_y2": 527.7828099999999, "r_x3": 231.787, "r_y3": 527.7828099999999, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76401, "r_y0": 536.80893, "r_x1": 286.36169, "r_y1": 536.80893, "r_x2": 286.36169, "r_y2": 527.90237, "r_x3": 269.76401, "r_y3": 527.90237, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 548.76393, "r_x1": 286.36508, "r_y1": 548.76393, "r_x2": 286.36508, "r_y2": 539.85738, "r_x3": 50.112015, "r_y3": 539.85738, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 560.71992, "r_x1": 205.84735, "r_y1": 560.71992, "r_x2": 205.84735, "r_y2": 551.81337, "r_x3": 50.112015, "r_y3": 551.81337, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.01802, "r_y0": 560.6501900000001, "r_x1": 286.36392, "r_y1": 560.6501900000001, "r_x2": 286.36392, "r_y2": 551.69382, "r_x3": 208.01802, "r_y3": 551.69382, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 572.67493, "r_x1": 64.498009, "r_y1": 572.67493, "r_x2": 64.498009, "r_y2": 563.76837, "r_x3": 50.112015, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.165016, "r_y0": 572.60519, "r_x1": 151.31288, "r_y1": 572.60519, "r_x2": 151.31288, "r_y2": 563.64882, "r_x3": 68.165016, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31302, "r_y0": 572.67493, "r_x1": 153.80367, "r_y1": 572.67493, "r_x2": 153.80367, "r_y2": 563.76837, "r_x3": 151.31302, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.41884, "r_y0": 572.67493, "r_x1": 241.93283000000002, "r_y1": 572.67493, "r_x2": 241.93283000000002, "r_y2": 563.76837, "r_x3": 160.41884, "r_y3": 563.76837, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.59502, "r_y0": 572.60519, "r_x1": 286.362, "r_y1": 572.60519, "r_x2": 286.362, "r_y2": 563.64882, "r_x3": 245.59502, "r_y3": 563.64882, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 584.5602, "r_x1": 85.519089, "r_y1": 584.5602, "r_x2": 85.519089, "r_y2": 575.60382, "r_x3": 50.112015, "r_y3": 575.60382, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.623016, "r_y0": 584.6299300000001, "r_x1": 286.36072, "r_y1": 584.6299300000001, "r_x2": 286.36072, "r_y2": 575.7233699999999, "r_x3": 88.623016, "r_y3": 575.7233699999999, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 596.58493, "r_x1": 286.36511, "r_y1": 596.58493, "r_x2": 286.36511, "r_y2": 587.6783800000001, "r_x3": 50.112015, "r_y3": 587.6783800000001, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 608.53993, "r_x1": 286.36508, "r_y1": 608.53993, "r_x2": 286.36508, "r_y2": 599.63338, "r_x3": 50.112015, "r_y3": 599.63338, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 620.4949300000001, "r_x1": 240.43756000000002, "r_y1": 620.4949300000001, "r_x2": 240.43756000000002, "r_y2": 611.58838, "r_x3": 50.112015, "r_y3": 611.58838, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.19801, "r_y0": 620.4252, "r_x1": 286.36597, "r_y1": 620.4252, "r_x2": 286.36597, "r_y2": 611.46883, "r_x3": 243.19801, "r_y3": 611.46883, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 632.3812, "r_x1": 286.36511, "r_y1": 632.3812, "r_x2": 286.36511, "r_y2": 623.42482, "r_x3": 50.112015, "r_y3": 623.42482, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 644.3362, "r_x1": 286.36508, "r_y1": 644.3362, "r_x2": 286.36508, "r_y2": 635.37982, "r_x3": 50.112015, "r_y3": 635.37982, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 656.36093, "r_x1": 220.58205, "r_y1": 656.36093, "r_x2": 220.58205, "r_y2": 647.45438, "r_x3": 50.112015, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.57802000000004, "r_y0": 656.14175, "r_x1": 228.32693, "r_y1": 656.14175, "r_x2": 228.32693, "r_y2": 647.29497, "r_x3": 220.57802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.32700999999997, "r_y0": 656.36093, "r_x1": 236.07791000000003, "r_y1": 656.36093, "r_x2": 236.07791000000003, "r_y2": 647.45438, "r_x3": 228.32700999999997, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.07802000000004, "r_y0": 656.14175, "r_x1": 243.82693, "r_y1": 656.14175, "r_x2": 243.82693, "r_y2": 647.29497, "r_x3": 236.07802000000004, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.82602, "r_y0": 656.36093, "r_x1": 255.29298000000003, "r_y1": 656.36093, "r_x2": 255.29298000000003, "r_y2": 647.45438, "r_x3": 243.82602, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29102000000003, "r_y0": 656.14175, "r_x1": 263.03992, "r_y1": 656.14175, "r_x2": 263.03992, "r_y2": 647.29497, "r_x3": 255.29102000000003, "r_y3": 647.29497, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04001, "r_y0": 656.36093, "r_x1": 286.36246, "r_y1": 656.36093, "r_x2": 286.36246, "r_y2": 647.45438, "r_x3": 263.04001, "r_y3": 647.45438, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 668.31594, "r_x1": 286.36511, "r_y1": 668.31594, "r_x2": 286.36511, "r_y2": 659.40938, "r_x3": 50.112015, "r_y3": 659.40938, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 680.27094, "r_x1": 218.46996, "r_y1": 680.27094, "r_x2": 218.46996, "r_y2": 671.36438, "r_x3": 50.112015, "r_y3": 671.36438, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes." }, { "label": "text", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.862, "t": 249.53441999999995, "r": 545.11505, "b": 294.3069499999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9831458330154419, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 258.44097999999997, "r_x1": 523.05786, "r_y1": 258.44097999999997, "r_x2": 523.05786, "r_y2": 249.53441999999995, "r_x3": 308.862, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.19983, "r_y0": 258.44097999999997, "r_x1": 545.11505, "r_y1": 258.44097999999997, "r_x2": 545.11505, "r_y2": 249.53441999999995, "r_x3": 525.19983, "r_y3": 249.53441999999995, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 270.39697, "r_x1": 517.55847, "r_y1": 270.39697, "r_x2": 517.55847, "r_y2": 261.49042, "r_x3": 308.862, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 270.39697, "r_x1": 545.11499, "r_y1": 270.39697, "r_x2": 545.11499, "r_y2": 261.49042, "r_x3": 520.76642, "r_y3": 261.49042, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 282.35196, "r_x1": 534.80377, "r_y1": 282.35196, "r_x2": 534.80377, "r_y2": 273.44537, "r_x3": 308.862, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36414, "r_y0": 282.35196, "r_x1": 545.11505, "r_y1": 282.35196, "r_x2": 545.11505, "r_y2": 273.44537, "r_x3": 537.36414, "r_y3": 273.44537, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 294.3069499999999, "r_x1": 341.24045, "r_y1": 294.3069499999999, "r_x2": 341.24045, "r_y2": 285.40039, "r_x3": 308.862, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73099, "r_y0": 294.07782000000003, "r_x1": 417.23508, "r_y1": 294.07782000000003, "r_x2": 417.23508, "r_y2": 285.49005, "r_x3": 343.73099, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23398, "r_y0": 294.3069499999999, "r_x1": 436.60129, "r_y1": 294.3069499999999, "r_x2": 436.60129, "r_y2": 285.40039, "r_x3": 417.23398, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09198, "r_y0": 294.07782000000003, "r_x1": 516.56116, "r_y1": 294.07782000000003, "r_x2": 516.56116, "r_y2": 285.49005, "r_x3": 439.09198, "r_y3": 285.49005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56097, "r_y0": 294.3069499999999, "r_x1": 519.05164, "r_y1": 294.3069499999999, "r_x2": 519.05164, "r_y2": 285.40039, "r_x3": 516.56097, "r_y3": 285.40039, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86194, "t": 297.33981, "r": 545.11511, "b": 413.96182, "coord_origin": "TOPLEFT" }, "confidence": 0.9862009882926941, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 306.2962, "r_x1": 400.86649, "r_y1": 306.2962, "r_x2": 400.86649, "r_y2": 297.33981, "r_x3": 320.81696, "r_y3": 297.33981, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91394, "r_y0": 306.36594, "r_x1": 528.33685, "r_y1": 306.36594, "r_x2": 528.33685, "r_y2": 297.45938, "r_x3": 403.91394, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.7179, "r_y0": 306.36594, "r_x1": 545.11383, "r_y1": 306.36594, "r_x2": 545.11383, "r_y2": 297.45938, "r_x3": 530.7179, "r_y3": 297.45938, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 318.32092, "r_x1": 517.5285, "r_y1": 318.32092, "r_x2": 517.5285, "r_y2": 309.41437, "r_x3": 308.86194, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09387, "r_y0": 318.32092, "r_x1": 545.11493, "r_y1": 318.32092, "r_x2": 545.11493, "r_y2": 309.41437, "r_x3": 524.09387, "r_y3": 309.41437, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 330.27591, "r_x1": 432.35833999999994, "r_y1": 330.27591, "r_x2": 432.35833999999994, "r_y2": 321.36934999999994, "r_x3": 308.86194, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.81995000000006, "r_y0": 330.04678, "r_x1": 510.29041, "r_y1": 330.04678, "r_x2": 510.29041, "r_y2": 321.45901, "r_x3": 435.81995000000006, "r_y3": 321.45901, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.97797, "r_y0": 330.27591, "r_x1": 520.62305, "r_y1": 330.27591, "r_x2": 520.62305, "r_y2": 321.36934999999994, "r_x3": 513.97797, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08008, "r_y0": 330.27591, "r_x1": 545.11115, "r_y1": 330.27591, "r_x2": 545.11115, "r_y2": 321.36934999999994, "r_x3": 524.08008, "r_y3": 321.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 342.2309, "r_x1": 527.76013, "r_y1": 342.2309, "r_x2": 527.76013, "r_y2": 333.32434, "r_x3": 308.86197, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.729, "r_y0": 342.2309, "r_x1": 545.11499, "r_y1": 342.2309, "r_x2": 545.11499, "r_y2": 333.32434, "r_x3": 530.729, "r_y3": 333.32434, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 354.18588, "r_x1": 526.85352, "r_y1": 354.18588, "r_x2": 526.85352, "r_y2": 345.27933, "r_x3": 308.86197, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62311, "r_y0": 354.18588, "r_x1": 545.11493, "r_y1": 354.18588, "r_x2": 545.11493, "r_y2": 345.27933, "r_x3": 529.62311, "r_y3": 345.27933, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 366.14188, "r_x1": 524.51245, "r_y1": 366.14188, "r_x2": 524.51245, "r_y2": 357.23532, "r_x3": 308.86197, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.96948, "r_y0": 366.14188, "r_x1": 545.11511, "r_y1": 366.14188, "r_x2": 545.11511, "r_y2": 357.23532, "r_x3": 527.96948, "r_y3": 357.23532, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 378.09685999999994, "r_x1": 370.39096, "r_y1": 378.09685999999994, "r_x2": 370.39096, "r_y2": 369.19031000000007, "r_x3": 308.86197, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44449, "r_y0": 378.09685999999994, "r_x1": 526.91339, "r_y1": 378.09685999999994, "r_x2": 526.91339, "r_y2": 369.19031000000007, "r_x3": 377.44449, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72906, "r_y0": 378.09685999999994, "r_x1": 545.11505, "r_y1": 378.09685999999994, "r_x2": 545.11505, "r_y2": 369.19031000000007, "r_x3": 530.72906, "r_y3": 369.19031000000007, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 390.05185, "r_x1": 505.46395999999993, "r_y1": 390.05185, "r_x2": 505.46395999999993, "r_y2": 381.14529000000005, "r_x3": 308.86197, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03430000000003, "r_y0": 390.05185, "r_x1": 545.11511, "r_y1": 390.05185, "r_x2": 545.11511, "r_y2": 381.14529000000005, "r_x3": 508.03430000000003, "r_y3": 381.14529000000005, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 402.00684, "r_x1": 517.68799, "r_y1": 402.00684, "r_x2": 517.68799, "r_y2": 393.10028, "r_x3": 308.86197, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.76642, "r_y0": 402.00684, "r_x1": 545.11499, "r_y1": 402.00684, "r_x2": 545.11499, "r_y2": 393.10028, "r_x3": 520.76642, "r_y3": 393.10028, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 413.96182, "r_x1": 528.01935, "r_y1": 413.96182, "r_x2": 528.01935, "r_y2": 405.05526999999995, "r_x3": 308.86197, "r_y3": 405.05526999999995, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. \"Scene Understanding\", \"Image Captioning\"), something which we relate to the simplicity of table images." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86197, "t": 417.11426, "r": 545.11511, "b": 545.57271, "coord_origin": "TOPLEFT" }, "confidence": 0.9851906895637512, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 426.02081, "r_x1": 515.49609, "r_y1": 426.02081, "r_x2": 515.49609, "r_y2": 417.11426, "r_x3": 320.81696, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.7663, "r_y0": 426.02081, "r_x1": 545.11487, "r_y1": 426.02081, "r_x2": 545.11487, "r_y2": 417.11426, "r_x3": 520.7663, "r_y3": 417.11426, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 437.9758, "r_x1": 343.72107, "r_y1": 437.9758, "r_x2": 343.72107, "r_y2": 429.0692399999999, "r_x3": 308.86197, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.03796, "r_y0": 437.74667, "r_x1": 446.45471000000003, "r_y1": 437.74667, "r_x2": 446.45471000000003, "r_y2": 429.15891, "r_x3": 347.03796, "r_y3": 429.15891, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.93996999999996, "r_y0": 437.9758, "r_x1": 503.06055000000003, "r_y1": 437.9758, "r_x2": 503.06055000000003, "r_y2": 429.0692399999999, "r_x3": 449.93996999999996, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.37808, "r_y0": 437.9758, "r_x1": 537.3717, "r_y1": 437.9758, "r_x2": 537.3717, "r_y2": 429.0692399999999, "r_x3": 506.37808, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.68927, "r_y0": 437.9758, "r_x1": 545.11267, "r_y1": 437.9758, "r_x2": 545.11267, "r_y2": 429.0692399999999, "r_x3": 540.68927, "r_y3": 429.0692399999999, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 449.93079, "r_x1": 522.78894, "r_y1": 449.93079, "r_x2": 522.78894, "r_y2": 441.02423, "r_x3": 308.86197, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.7478, "r_y0": 449.93079, "r_x1": 545.11511, "r_y1": 449.93079, "r_x2": 545.11511, "r_y2": 441.02423, "r_x3": 525.7478, "r_y3": 441.02423, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 461.88577, "r_x1": 384.14929, "r_y1": 461.88577, "r_x2": 384.14929, "r_y2": 452.97922, "r_x3": 308.86197, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37466, "r_y0": 461.88577, "r_x1": 527.84985, "r_y1": 461.88577, "r_x2": 527.84985, "r_y2": 452.97922, "r_x3": 393.37466, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39282, "r_y0": 461.88577, "r_x1": 545.11505, "r_y1": 461.88577, "r_x2": 545.11505, "r_y2": 452.97922, "r_x3": 532.39282, "r_y3": 452.97922, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 473.84177, "r_x1": 529.7627, "r_y1": 473.84177, "r_x2": 529.7627, "r_y2": 464.93521, "r_x3": 308.86197, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94073, "r_y0": 473.84177, "r_x1": 545.11505, "r_y1": 473.84177, "r_x2": 545.11505, "r_y2": 464.93521, "r_x3": 532.94073, "r_y3": 464.93521, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 485.79675, "r_x1": 514.17126, "r_y1": 485.79675, "r_x2": 514.17126, "r_y2": 476.8902, "r_x3": 308.86197, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89105, "r_y0": 485.79675, "r_x1": 545.11511, "r_y1": 485.79675, "r_x2": 545.11511, "r_y2": 476.8902, "r_x3": 516.89105, "r_y3": 476.8902, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 497.75174, "r_x1": 527.63068, "r_y1": 497.75174, "r_x2": 527.63068, "r_y2": 488.84518, "r_x3": 308.86197, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62317, "r_y0": 497.75174, "r_x1": 545.11499, "r_y1": 497.75174, "r_x2": 545.11499, "r_y2": 488.84518, "r_x3": 529.62317, "r_y3": 488.84518, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 509.70673, "r_x1": 508.3630999999999, "r_y1": 509.70673, "r_x2": 508.3630999999999, "r_y2": 500.80017, "r_x3": 308.86197, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09286000000003, "r_y0": 509.70673, "r_x1": 545.11511, "r_y1": 509.70673, "r_x2": 545.11511, "r_y2": 500.80017, "r_x3": 511.09286000000003, "r_y3": 500.80017, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 521.6617100000001, "r_x1": 545.11499, "r_y1": 521.6617100000001, "r_x2": 545.11499, "r_y2": 512.7551599999999, "r_x3": 308.86197, "r_y3": 512.7551599999999, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 533.61771, "r_x1": 545.11511, "r_y1": 533.61771, "r_x2": 545.11511, "r_y2": 524.71115, "r_x3": 308.86197, "r_y3": 524.71115, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 545.57271, "r_x1": 369.73349, "r_y1": 545.57271, "r_x2": 369.73349, "r_y2": 536.66615, "r_x3": 308.86197, "r_y3": 536.66615, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score." }, { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86194, "t": 548.6046, "r": 545.11511, "b": 653.27271, "coord_origin": "TOPLEFT" }, "confidence": 0.9869195818901062, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81696, "r_y0": 557.56097, "r_x1": 404.76184, "r_y1": 557.56097, "r_x2": 404.76184, "r_y2": 548.6046, "r_x3": 320.81696, "r_y3": 548.6046, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34094, "r_y0": 557.63071, "r_x1": 545.11505, "r_y1": 557.63071, "r_x2": 545.11505, "r_y2": 548.72415, "r_x3": 410.34094, "r_y3": 548.72415, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 569.5867000000001, "r_x1": 545.11493, "r_y1": 569.5867000000001, "r_x2": 545.11493, "r_y2": 560.68015, "r_x3": 308.86194, "r_y3": 560.68015, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 581.5417, "r_x1": 545.11511, "r_y1": 581.5417, "r_x2": 545.11511, "r_y2": 572.6351500000001, "r_x3": 308.86194, "r_y3": 572.6351500000001, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 593.4967, "r_x1": 545.11493, "r_y1": 593.4967, "r_x2": 545.11493, "r_y2": 584.59015, "r_x3": 308.86194, "r_y3": 584.59015, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 605.45171, "r_x1": 545.11499, "r_y1": 605.45171, "r_x2": 545.11499, "r_y2": 596.54515, "r_x3": 308.86194, "r_y3": 596.54515, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 617.40671, "r_x1": 545.11505, "r_y1": 617.40671, "r_x2": 545.11505, "r_y2": 608.50015, "r_x3": 308.86194, "r_y3": 608.50015, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 629.36171, "r_x1": 545.11505, "r_y1": 629.36171, "r_x2": 545.11505, "r_y2": 620.45515, "r_x3": 308.86194, "r_y3": 620.45515, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 641.3177000000001, "r_x1": 381.67859, "r_y1": 641.3177000000001, "r_x2": 381.67859, "r_y2": 632.41115, "r_x3": 308.86194, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.99695, "r_y0": 641.09853, "r_x1": 391.74585, "r_y1": 641.09853, "r_x2": 391.74585, "r_y2": 632.25174, "r_x3": 383.99695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.74594, "r_y0": 641.3177000000001, "r_x1": 399.49686, "r_y1": 641.3177000000001, "r_x2": 399.49686, "r_y2": 632.41115, "r_x3": 391.74594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.49695, "r_y0": 641.09853, "r_x1": 407.24585, "r_y1": 641.09853, "r_x2": 407.24585, "r_y2": 632.25174, "r_x3": 399.49695, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.24594, "r_y0": 641.3177000000001, "r_x1": 432.90958, "r_y1": 641.3177000000001, "r_x2": 432.90958, "r_y2": 632.41115, "r_x3": 407.24594, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.90792999999996, "r_y0": 641.09853, "r_x1": 440.65683000000007, "r_y1": 641.09853, "r_x2": 440.65683000000007, "r_y2": 632.25174, "r_x3": 432.90792999999996, "r_y3": 632.25174, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.65691999999996, "r_y0": 641.3177000000001, "r_x1": 545.11475, "r_y1": 641.3177000000001, "r_x2": 545.11475, "r_y2": 632.41115, "r_x3": 440.65691999999996, "r_y3": 632.41115, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 653.27271, "r_x1": 398.96371, "r_y1": 653.27271, "r_x2": 398.96371, "r_y2": 644.3661500000001, "r_x3": 308.86194, "r_y3": 644.3661500000001, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTML structure tags become the object query." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86194, "t": 656.42516, "r": 545.11505, "b": 713.151726, "coord_origin": "TOPLEFT" }, "confidence": 0.9852352142333984, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81693, "r_y0": 665.33172, "r_x1": 444.34316999999993, "r_y1": 665.33172, "r_x2": 444.34316999999993, "r_y2": 656.42516, "r_x3": 320.81693, "r_y3": 656.42516, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.00591999999995, "r_y0": 665.10258, "r_x1": 545.1076, "r_y1": 665.10258, "r_x2": 545.1076, "r_y2": 656.51482, "r_x3": 447.00591999999995, "r_y3": 656.51482, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 677.2867200000001, "r_x1": 545.11505, "r_y1": 677.2867200000001, "r_x2": 545.11505, "r_y2": 668.38016, "r_x3": 308.86194, "r_y3": 668.38016, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 689.24172, "r_x1": 545.11505, "r_y1": 689.24172, "r_x2": 545.11505, "r_y2": 680.33516, "r_x3": 308.86194, "r_y3": 680.33516, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 701.196724, "r_x1": 545.11505, "r_y1": 701.196724, "r_x2": 545.11505, "r_y2": 692.290161, "r_x3": 308.86194, "r_y3": 692.290161, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86194, "r_y0": 713.151726, "r_x1": 545.11505, "r_y1": 713.151726, "r_x2": 545.11505, "r_y2": 704.245163, "r_x3": 308.86194, "r_y3": 704.245163, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-" } ], "headers": [ { "label": "page_footer", "id": 9, "page_no": 4, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.12094, "t": 734.13316, "r": 300.10223, "b": 743.039722, "coord_origin": "TOPLEFT" }, "confidence": 0.8719564080238342, "cells": [ { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12094, "r_y0": 743.039722, "r_x1": 300.10223, "r_y1": 743.039722, "r_x2": 300.10223, "r_y2": 734.13316, "r_x3": 295.12094, "r_y3": 734.13316, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" } ] } }, { "page_no": 5, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36514, "r_y1": 84.11492999999996, "r_x2": 286.36514, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 286.36508, "r_y1": 96.06994999999995, "r_x2": 286.36508, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 286.36508, "r_y1": 108.02495999999985, "r_x2": 286.36508, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 119.97997999999984, "r_x1": 286.36508, "r_y1": 119.97997999999984, "r_x2": 286.36508, "r_y2": 111.07343000000003, "r_x3": 50.112, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.93499999999995, "r_x1": 286.36508, "r_y1": 131.93499999999995, "r_x2": 286.36508, "r_y2": 123.02844000000005, "r_x3": 50.112, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.89099, "r_x1": 286.36514, "r_y1": 143.89099, "r_x2": 286.36514, "r_y2": 134.98443999999995, "r_x3": 50.112, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.84600999999998, "r_x1": 175.16254, "r_y1": 155.84600999999998, "r_x2": 175.16254, "r_y2": 146.93944999999997, "r_x3": 50.112, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 168.53101000000004, "r_x1": 286.36496, "r_y1": 168.53101000000004, "r_x2": 286.36496, "r_y2": 159.62445000000002, "r_x3": 62.067001, "r_y3": 159.62445000000002, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.48699999999997, "r_x1": 286.36511, "r_y1": 180.48699999999997, "r_x2": 286.36511, "r_y2": 171.58043999999995, "r_x3": 50.112, "r_y3": 171.58043999999995, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.44201999999996, "r_x1": 286.36511, "r_y1": 192.44201999999996, "r_x2": 286.36511, "r_y2": 183.53545999999994, "r_x3": 50.112, "r_y3": 183.53545999999994, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.39702999999997, "r_x1": 286.36511, "r_y1": 204.39702999999997, "r_x2": 286.36511, "r_y2": 195.49048000000005, "r_x3": 50.112, "r_y3": 195.49048000000005, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.35204999999996, "r_x1": 286.36511, "r_y1": 216.35204999999996, "r_x2": 286.36511, "r_y2": 207.44550000000004, "r_x3": 50.112, "r_y3": 207.44550000000004, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.30706999999995, "r_x1": 286.36511, "r_y1": 228.30706999999995, "r_x2": 286.36511, "r_y2": 219.40051000000005, "r_x3": 50.112, "r_y3": 219.40051000000005, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 240.26306, "r_x1": 181.54855, "r_y1": 240.26306, "r_x2": 181.54855, "r_y2": 231.35650999999996, "r_x3": 50.112, "r_y3": 231.35650999999996, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.87829999999997, "r_x1": 129.21492, "r_y1": 252.87829999999997, "r_x2": 129.21492, "r_y2": 243.92193999999995, "r_x3": 62.067001, "r_y3": 243.92193999999995, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.451, "r_y0": 252.94806000000005, "r_x1": 286.36078, "r_y1": 252.94806000000005, "r_x2": 286.36078, "r_y2": 244.04150000000004, "r_x3": 134.451, "r_y3": 244.04150000000004, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 264.90308000000005, "r_x1": 286.36511, "r_y1": 264.90308000000005, "r_x2": 286.36511, "r_y2": 255.99652000000003, "r_x3": 50.112007, "r_y3": 255.99652000000003, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 276.63989000000004, "r_x1": 56.84528, "r_y1": 276.63989000000004, "r_x2": 56.84528, "r_y2": 267.79309, "r_x3": 50.112007, "r_y3": 267.79309, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.343006, "r_y0": 276.85907, "r_x1": 135.39996, "r_y1": 276.85907, "r_x2": 135.39996, "r_y2": 267.95250999999996, "r_x3": 57.343006, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.735, "r_y0": 276.62994000000003, "r_x1": 211.07965, "r_y1": 276.62994000000003, "r_x2": 211.07965, "r_y2": 268.04218000000003, "r_x3": 137.735, "r_y3": 268.04218000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.63699, "r_y0": 276.85907, "r_x1": 286.36395, "r_y1": 276.85907, "r_x2": 286.36395, "r_y2": 267.95250999999996, "r_x3": 213.63699, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.81406, "r_x1": 158.82388, "r_y1": 288.81406, "r_x2": 158.82388, "r_y2": 279.90747, "r_x3": 50.112, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.31799, "r_y0": 288.58493, "r_x1": 238.79712, "r_y1": 288.58493, "r_x2": 238.79712, "r_y2": 279.99712999999997, "r_x3": 161.31799, "r_y3": 279.99712999999997, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.521, "r_y0": 288.81406, "r_x1": 286.36264, "r_y1": 288.81406, "r_x2": 286.36264, "r_y2": 279.90747, "r_x3": 241.521, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.76904, "r_x1": 211.3766, "r_y1": 300.76904, "r_x2": 211.3766, "r_y2": 291.86249, "r_x3": 50.112, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.271, "r_y0": 300.54987, "r_x1": 229.19780000000003, "r_y1": 300.54987, "r_x2": 229.19780000000003, "r_y2": 291.70309, "r_x3": 214.271, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.696, "r_y0": 300.76904, "r_x1": 232.18665000000001, "r_y1": 300.76904, "r_x2": 232.18665000000001, "r_y2": 291.86249, "r_x3": 229.696, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49001, "r_y0": 300.54987, "r_x1": 251.41681000000003, "r_y1": 300.54987, "r_x2": 251.41681000000003, "r_y2": 291.70309, "r_x3": 236.49001, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81099999999998, "r_y0": 300.76904, "r_x1": 286.36255, "r_y1": 300.76904, "r_x2": 286.36255, "r_y2": 291.86249, "r_x3": 254.81099999999998, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.72403, "r_x1": 137.45412, "r_y1": 312.72403, "r_x2": 137.45412, "r_y2": 303.81747, "r_x3": 50.112, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.298, "r_y0": 312.50485, "r_x1": 148.24258, "r_y1": 312.50485, "r_x2": 148.24258, "r_y2": 303.65808, "r_x3": 141.298, "r_y3": 303.65808, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.58601, "r_y0": 312.72403, "r_x1": 286.36377, "r_y1": 312.72403, "r_x2": 286.36377, "r_y2": 303.81747, "r_x3": 152.58601, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 324.67902, "r_x1": 89.683464, "r_y1": 324.67902, "r_x2": 89.683464, "r_y2": 315.77245999999997, "r_x3": 50.112015, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.68602, "r_y0": 324.45984, "r_x1": 104.12046, "r_y1": 324.45984, "r_x2": 104.12046, "r_y2": 315.61307, "r_x3": 89.68602, "r_y3": 315.61307, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.61802, "r_y0": 324.67902, "r_x1": 286.36572, "r_y1": 324.67902, "r_x2": 286.36572, "r_y2": 315.77245999999997, "r_x3": 104.61802, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 336.6350100000001, "r_x1": 286.36511, "r_y1": 336.6350100000001, "r_x2": 286.36511, "r_y2": 327.72845, "r_x3": 50.112019, "r_y3": 327.72845, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 348.59, "r_x1": 286.36508, "r_y1": 348.59, "r_x2": 286.36508, "r_y2": 339.68344, "r_x3": 50.112019, "r_y3": 339.68344, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 360.54498, "r_x1": 286.36511, "r_y1": 360.54498, "r_x2": 286.36511, "r_y2": 351.63843, "r_x3": 50.112019, "r_y3": 351.63843, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 372.49996999999996, "r_x1": 286.36508, "r_y1": 372.49996999999996, "r_x2": 286.36508, "r_y2": 363.59341, "r_x3": 50.112019, "r_y3": 363.59341, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 384.45496, "r_x1": 286.36511, "r_y1": 384.45496, "r_x2": 286.36511, "r_y2": 375.5484, "r_x3": 50.112019, "r_y3": 375.5484, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 396.40994, "r_x1": 286.36514, "r_y1": 396.40994, "r_x2": 286.36514, "r_y2": 387.50339, "r_x3": 50.112019, "r_y3": 387.50339, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 408.36594, "r_x1": 88.68721, "r_y1": 408.36594, "r_x2": 88.68721, "r_y2": 399.45938, "r_x3": 50.112019, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.646019, "r_y0": 408.13681, "r_x1": 170.0517, "r_y1": 408.13681, "r_x2": 170.0517, "r_y2": 399.54904, "r_x3": 91.646019, "r_y3": 399.54904, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05103, "r_y0": 408.36594, "r_x1": 286.36438, "r_y1": 408.36594, "r_x2": 286.36438, "r_y2": 399.45938, "r_x3": 170.05103, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 420.32092, "r_x1": 181.96703, "r_y1": 420.32092, "r_x2": 181.96703, "r_y2": 411.41437, "r_x3": 50.112022, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09029, "r_y0": 420.32092, "r_x1": 197.74918, "r_y1": 420.32092, "r_x2": 197.74918, "r_y2": 411.41437, "r_x3": 189.09029, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.34789, "r_y0": 420.32092, "r_x1": 286.36511, "r_y1": 420.32092, "r_x2": 286.36511, "r_y2": 411.41437, "r_x3": 200.34789, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 432.27591, "r_x1": 286.36511, "r_y1": 432.27591, "r_x2": 286.36511, "r_y2": 423.36934999999994, "r_x3": 50.112022, "r_y3": 423.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 444.2309, "r_x1": 158.2959, "r_y1": 444.2309, "r_x2": 158.2959, "r_y2": 435.32434, "r_x3": 50.112022, "r_y3": 435.32434, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067024, "r_y0": 456.9169, "r_x1": 286.36499, "r_y1": 456.9169, "r_x2": 286.36499, "r_y2": 448.01035, "r_x3": 62.067024, "r_y3": 448.01035, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 468.87189, "r_x1": 91.377113, "r_y1": 468.87189, "r_x2": 91.377113, "r_y2": 459.96533, "r_x3": 50.112022, "r_y3": 459.96533, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.71502, "r_y0": 502.12772, "r_x1": 140.64182, "r_y1": 502.12772, "r_x2": 140.64182, "r_y2": 493.28094, "r_x3": 125.71502, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.90701, "r_y0": 502.12772, "r_x1": 151.65593, "r_y1": 502.12772, "r_x2": 151.65593, "r_y2": 493.28094, "r_x3": 143.90701, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42302, "r_y0": 502.12772, "r_x1": 186.62846, "r_y1": 502.12772, "r_x2": 186.62846, "r_y2": 493.28094, "r_x3": 154.42302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34003, "r_y0": 502.12772, "r_x1": 197.08894, "r_y1": 502.12772, "r_x2": 197.08894, "r_y2": 493.28094, "r_x3": 189.34003, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.30302, "r_y0": 502.12772, "r_x1": 211.64659, "r_y1": 502.12772, "r_x2": 211.64659, "r_y2": 493.28094, "r_x3": 199.30302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33002, "r_y0": 517.07172, "r_x1": 127.30286, "r_y1": 517.07172, "r_x2": 127.30286, "r_y2": 508.22495, "r_x3": 124.33002, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.26602, "r_y0": 517.07172, "r_x1": 138.01494, "r_y1": 517.07172, "r_x2": 138.01494, "r_y2": 508.22495, "r_x3": 130.26602, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78203, "r_y0": 517.07172, "r_x1": 153.32629, "r_y1": 517.07172, "r_x2": 153.32629, "r_y2": 508.22495, "r_x3": 140.78203, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.03903, "r_y0": 517.07172, "r_x1": 174.85541, "r_y1": 517.07172, "r_x2": 174.85541, "r_y2": 508.22495, "r_x3": 156.03903, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07103, "r_y0": 517.07172, "r_x1": 184.81995, "r_y1": 517.07172, "r_x2": 184.81995, "r_y2": 507.66702, "r_x3": 177.07103, "r_y3": 507.66702, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03304, "r_y0": 517.07172, "r_x1": 192.84422, "r_y1": 517.07172, "r_x2": 192.84422, "r_y2": 508.22495, "r_x3": 187.03304, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.84503, "r_y0": 517.07172, "r_x1": 196.71948, "r_y1": 517.07172, "r_x2": 196.71948, "r_y2": 508.22495, "r_x3": 192.84503, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.71902, "r_y0": 517.07172, "r_x1": 211.64583, "r_y1": 517.07172, "r_x2": 211.64583, "r_y2": 508.22495, "r_x3": 196.71902, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74603, "r_y0": 509.91788, "r_x1": 286.36243, "r_y1": 509.91788, "r_x2": 286.36243, "r_y2": 501.01132, "r_x3": 274.74603, "r_y3": 501.01132, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 540.21588, "r_x1": 74.450661, "r_y1": 540.21588, "r_x2": 74.450661, "r_y2": 531.30933, "r_x3": 50.11203, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.941032, "r_y0": 539.9967, "r_x1": 82.75222, "r_y1": 539.9967, "r_x2": 82.75222, "r_y2": 531.14993, "r_x3": 76.941032, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.520035, "r_y0": 539.9967, "r_x1": 92.162102, "r_y1": 539.9967, "r_x2": 92.162102, "r_y2": 530.5920100000001, "r_x3": 85.520035, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.653038, "r_y0": 540.21588, "r_x1": 135.59932, "r_y1": 540.21588, "r_x2": 135.59932, "r_y2": 531.30933, "r_x3": 94.653038, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09004, "r_y0": 539.9967, "r_x1": 172.63162, "r_y1": 539.9967, "r_x2": 172.63162, "r_y2": 531.14993, "r_x3": 138.09004, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.89705, "r_y0": 539.9967, "r_x1": 192.50104, "r_y1": 539.9967, "r_x2": 192.50104, "r_y2": 530.5920100000001, "r_x3": 175.89705, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99205, "r_y0": 540.21588, "r_x1": 281.59692, "r_y1": 540.21588, "r_x2": 281.59692, "r_y2": 531.30933, "r_x3": 194.99205, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 566.66461, "r_x1": 57.92831799999999, "r_y1": 566.66461, "r_x2": 57.92831799999999, "r_y2": 555.91689, "r_x3": 50.112045, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.350014, "r_y0": 566.66461, "r_x1": 171.98335, "r_y1": 566.66461, "r_x2": 171.98335, "r_y2": 555.91689, "r_x3": 68.350014, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 586.1163799999999, "r_x1": 64.693237, "r_y1": 586.1163799999999, "r_x2": 64.693237, "r_y2": 576.26433, "r_x3": 50.112045, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.414032, "r_y0": 586.1163799999999, "r_x1": 179.17502, "r_y1": 586.1163799999999, "r_x2": 179.17502, "r_y2": 576.26433, "r_x3": 74.414032, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067047, "r_y0": 604.64088, "r_x1": 202.97806, "r_y1": 604.64088, "r_x2": 202.97806, "r_y2": 595.73433, "r_x3": 62.067047, "r_y3": 595.73433, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38405, "r_y0": 604.41174, "r_x1": 286.36008, "r_y1": 604.41174, "r_x2": 286.36008, "r_y2": 595.82399, "r_x3": 205.38405, "r_y3": 595.82399, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 616.3667399999999, "r_x1": 70.037247, "r_y1": 616.3667399999999, "r_x2": 70.037247, "r_y2": 607.77899, "r_x3": 50.112045, "r_y3": 607.77899, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037048, "r_y0": 616.59589, "r_x1": 286.36496, "r_y1": 616.59589, "r_x2": 286.36496, "r_y2": 607.68933, "r_x3": 70.037048, "r_y3": 607.68933, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 628.55089, "r_x1": 286.36517, "r_y1": 628.55089, "r_x2": 286.36517, "r_y2": 619.64433, "r_x3": 50.112049, "r_y3": 619.64433, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 640.50688, "r_x1": 207.03294, "r_y1": 640.50688, "r_x2": 207.03294, "r_y2": 631.60033, "r_x3": 50.112049, "r_y3": 631.60033, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.661049, "r_y0": 663.45187, "r_x1": 186.01683, "r_y1": 663.45187, "r_x2": 186.01683, "r_y2": 654.54532, "r_x3": 91.661049, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.50705, "r_y0": 663.2327, "r_x1": 196.25597, "r_y1": 663.2327, "r_x2": 196.25597, "r_y2": 653.828, "r_x3": 188.50705, "r_y3": 653.828, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.74605, "r_y0": 663.45187, "r_x1": 244.81310999999997, "r_y1": 663.45187, "r_x2": 244.81310999999997, "r_y2": 654.54532, "r_x3": 198.74605, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.01604, "r_y0": 678.39588, "r_x1": 186.24606, "r_y1": 678.39588, "r_x2": 186.24606, "r_y2": 669.48932, "r_x3": 101.01604, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.73605, "r_y0": 678.1767, "r_x1": 196.48497, "r_y1": 678.1767, "r_x2": 196.48497, "r_y2": 668.77201, "r_x3": 188.73605, "r_y3": 668.77201, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.97505, "r_y0": 678.39588, "r_x1": 244.81296999999998, "r_y1": 678.39588, "r_x2": 244.81296999999998, "r_y2": 669.48932, "r_x3": 198.97505, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74606, "r_y0": 671.02388, "r_x1": 286.36246, "r_y1": 671.02388, "r_x2": 286.36246, "r_y2": 662.11731, "r_x3": 274.74606, "r_y3": 662.11731, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 701.196877, "r_x1": 286.36514, "r_y1": 701.196877, "r_x2": 286.36514, "r_y2": 692.290314, "r_x3": 50.112061, "r_y3": 692.290314, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 713.151878, "r_x1": 286.36514, "r_y1": 713.151878, "r_x2": 286.36514, "r_y2": 704.245316, "r_x3": 50.112061, "r_y3": 704.245316, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 84.11487, "r_x1": 545.11523, "r_y1": 84.11487, "r_x2": 545.11523, "r_y2": 75.20830999999998, "r_x3": 308.86206, "r_y3": 75.20830999999998, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 96.06988999999999, "r_x1": 339.98523, "r_y1": 96.06988999999999, "r_x2": 339.98523, "r_y2": 87.16332999999997, "r_x3": 308.86206, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.88931, "r_y0": 96.06988999999999, "r_x1": 545.11523, "r_y1": 96.06988999999999, "r_x2": 545.11523, "r_y2": 87.16332999999997, "r_x3": 346.88931, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 108.0249, "r_x1": 492.96097, "r_y1": 108.0249, "r_x2": 492.96097, "r_y2": 99.11835000000008, "r_x3": 308.86206, "r_y3": 99.11835000000008, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 125.13593000000003, "r_x1": 545.11499, "r_y1": 125.13593000000003, "r_x2": 545.11499, "r_y2": 116.22937000000002, "r_x3": 320.81705, "r_y3": 116.22937000000002, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 137.09094000000005, "r_x1": 545.11517, "r_y1": 137.09094000000005, "r_x2": 545.11517, "r_y2": 128.18439, "r_x3": 308.86206, "r_y3": 128.18439, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 149.04596000000004, "r_x1": 545.11505, "r_y1": 149.04596000000004, "r_x2": 545.11505, "r_y2": 140.13940000000002, "r_x3": 308.86206, "r_y3": 140.13940000000002, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 161.00098000000003, "r_x1": 545.11511, "r_y1": 161.00098000000003, "r_x2": 545.11511, "r_y2": 152.09442, "r_x3": 308.86206, "r_y3": 152.09442, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 172.95599000000004, "r_x1": 545.11517, "r_y1": 172.95599000000004, "r_x2": 545.11517, "r_y2": 164.04944, "r_x3": 308.86206, "r_y3": 164.04944, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 184.91198999999995, "r_x1": 467.21756000000005, "r_y1": 184.91198999999995, "r_x2": 467.21756000000005, "r_y2": 176.00543000000005, "r_x3": 308.86206, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.43671, "r_y0": 184.91198999999995, "r_x1": 545.11511, "r_y1": 184.91198999999995, "r_x2": 545.11511, "r_y2": 176.00543000000005, "r_x3": 475.43671, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 196.86699999999996, "r_x1": 545.11511, "r_y1": 196.86699999999996, "r_x2": 545.11511, "r_y2": 187.96045000000004, "r_x3": 308.86206, "r_y3": 187.96045000000004, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 208.82201999999995, "r_x1": 545.11511, "r_y1": 208.82201999999995, "r_x2": 545.11511, "r_y2": 199.91547000000003, "r_x3": 308.86206, "r_y3": 199.91547000000003, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 220.77704000000006, "r_x1": 545.11517, "r_y1": 220.77704000000006, "r_x2": 545.11517, "r_y2": 211.87048000000004, "r_x3": 308.86206, "r_y3": 211.87048000000004, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 232.73206000000005, "r_x1": 545.11511, "r_y1": 232.73206000000005, "r_x2": 545.11511, "r_y2": 223.82550000000003, "r_x3": 308.86206, "r_y3": 223.82550000000003, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 244.68706999999995, "r_x1": 545.11511, "r_y1": 244.68706999999995, "r_x2": 545.11511, "r_y2": 235.78052000000002, "r_x3": 308.86206, "r_y3": 235.78052000000002, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 256.64306999999997, "r_x1": 545.11523, "r_y1": 256.64306999999997, "r_x2": 545.11523, "r_y2": 247.73650999999995, "r_x3": 308.86206, "r_y3": 247.73650999999995, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 268.59808, "r_x1": 342.3364, "r_y1": 268.59808, "r_x2": 342.3364, "r_y2": 259.69152999999994, "r_x3": 308.86206, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95157, "r_y0": 268.59808, "r_x1": 545.11517, "r_y1": 268.59808, "r_x2": 545.11517, "r_y2": 259.69152999999994, "r_x3": 348.95157, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 280.55310000000003, "r_x1": 545.11517, "r_y1": 280.55310000000003, "r_x2": 545.11517, "r_y2": 271.64655000000005, "r_x3": 308.86206, "r_y3": 271.64655000000005, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 292.50809, "r_x1": 545.1153, "r_y1": 292.50809, "r_x2": 545.1153, "r_y2": 283.6015300000001, "r_x3": 308.86206, "r_y3": 283.6015300000001, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 304.46307, "r_x1": 545.11511, "r_y1": 304.46307, "r_x2": 545.11511, "r_y2": 295.55652, "r_x3": 308.86206, "r_y3": 295.55652, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 316.41806, "r_x1": 545.11511, "r_y1": 316.41806, "r_x2": 545.11511, "r_y2": 307.51151, "r_x3": 308.86206, "r_y3": 307.51151, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 328.37405, "r_x1": 532.48267, "r_y1": 328.37405, "r_x2": 532.48267, "r_y2": 319.4674999999999, "r_x3": 308.86206, "r_y3": 319.4674999999999, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 345.48407000000003, "r_x1": 545.11499, "r_y1": 345.48407000000003, "r_x2": 545.11499, "r_y2": 336.57751, "r_x3": 320.81705, "r_y3": 336.57751, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 357.43906, "r_x1": 403.7359, "r_y1": 357.43906, "r_x2": 403.7359, "r_y2": 348.5325000000001, "r_x3": 308.86206, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.07605, "r_y0": 357.20993, "r_x1": 503.54016, "r_y1": 357.20993, "r_x2": 503.54016, "r_y2": 348.62216, "r_x3": 406.07605, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.53906, "r_y0": 357.43906, "r_x1": 506.02972, "r_y1": 357.43906, "r_x2": 506.02972, "r_y2": 348.5325000000001, "r_x3": 503.53906, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.40004999999996, "r_y0": 357.20993, "r_x1": 545.11224, "r_y1": 357.20993, "r_x2": 545.11224, "r_y2": 348.62216, "r_x3": 508.40004999999996, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 369.16492000000005, "r_x1": 343.1633, "r_y1": 369.16492000000005, "r_x2": 343.1633, "r_y2": 360.57715, "r_x3": 308.86206, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16306, "r_y0": 369.39404, "r_x1": 362.2016, "r_y1": 369.39404, "r_x2": 362.2016, "r_y2": 360.48749, "r_x3": 343.16306, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.28604, "r_y0": 369.16492000000005, "r_x1": 440.93829, "r_y1": 369.16492000000005, "r_x2": 440.93829, "r_y2": 360.57715, "r_x3": 364.28604, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.93903, "r_y0": 369.39404, "r_x1": 545.10797, "r_y1": 369.39404, "r_x2": 545.10797, "r_y2": 360.48749, "r_x3": 440.93903, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 381.34903, "r_x1": 545.11511, "r_y1": 381.34903, "r_x2": 545.11511, "r_y2": 372.44247, "r_x3": 308.86203, "r_y3": 372.44247, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 393.30502, "r_x1": 545.11517, "r_y1": 393.30502, "r_x2": 545.11517, "r_y2": 384.3984699999999, "r_x3": 308.86203, "r_y3": 384.3984699999999, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 405.04083, "r_x1": 314.67322, "r_y1": 405.04083, "r_x2": 314.67322, "r_y2": 396.19406000000004, "r_x3": 308.86203, "r_y3": 396.19406000000004, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.65802, "r_y0": 405.2600100000001, "r_x1": 360.39139, "r_y1": 405.2600100000001, "r_x2": 360.39139, "r_y2": 396.35345, "r_x3": 318.65802, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96295, "r_y0": 405.2600100000001, "r_x1": 545.10803, "r_y1": 405.2600100000001, "r_x2": 545.10803, "r_y2": 396.35345, "r_x3": 367.96295, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 417.215, "r_x1": 545.11511, "r_y1": 417.215, "r_x2": 545.11511, "r_y2": 408.30844, "r_x3": 308.86203, "r_y3": 408.30844, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 429.16998, "r_x1": 360.9664, "r_y1": 429.16998, "r_x2": 360.9664, "r_y2": 420.26343, "r_x3": 308.86203, "r_y3": 420.26343, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 446.28098, "r_x1": 545.11499, "r_y1": 446.28098, "r_x2": 545.11499, "r_y2": 437.37441999999993, "r_x3": 320.81702, "r_y3": 437.37441999999993, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 458.23596, "r_x1": 384.62759, "r_y1": 458.23596, "r_x2": 384.62759, "r_y2": 449.32941, "r_x3": 308.86203, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37228, "r_y0": 458.23596, "r_x1": 545.11511, "r_y1": 458.23596, "r_x2": 545.11511, "r_y2": 449.32941, "r_x3": 391.37228, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 470.19095, "r_x1": 494.00693000000007, "r_y1": 470.19095, "r_x2": 494.00693000000007, "r_y2": 461.28439, "r_x3": 308.86203, "r_y3": 461.28439, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.07803, "r_y0": 469.96182, "r_x1": 545.11145, "r_y1": 469.96182, "r_x2": 545.11145, "r_y2": 461.37405, "r_x3": 498.07803, "r_y3": 461.37405, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 481.91681, "r_x1": 364.44336, "r_y1": 481.91681, "r_x2": 364.44336, "r_y2": 473.32904, "r_x3": 308.86203, "r_y3": 473.32904, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06104, "r_y0": 482.14594, "r_x1": 545.11267, "r_y1": 482.14594, "r_x2": 545.11267, "r_y2": 473.23938, "r_x3": 367.06104, "r_y3": 473.23938, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 494.10092, "r_x1": 545.11511, "r_y1": 494.10092, "r_x2": 545.11511, "r_y2": 485.19437, "r_x3": 308.86203, "r_y3": 485.19437, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 506.05591, "r_x1": 545.11523, "r_y1": 506.05591, "r_x2": 545.11523, "r_y2": 497.14935, "r_x3": 308.86203, "r_y3": 497.14935, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 518.0119, "r_x1": 545.11511, "r_y1": 518.0119, "r_x2": 545.11511, "r_y2": 509.10535, "r_x3": 308.86203, "r_y3": 509.10535, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 529.9668899999999, "r_x1": 545.11517, "r_y1": 529.9668899999999, "r_x2": 545.11517, "r_y2": 521.06033, "r_x3": 308.86203, "r_y3": 521.06033, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 541.9218900000001, "r_x1": 545.11517, "r_y1": 541.9218900000001, "r_x2": 545.11517, "r_y2": 533.01532, "r_x3": 308.86203, "r_y3": 533.01532, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 553.87689, "r_x1": 377.21548, "r_y1": 553.87689, "r_x2": 377.21548, "r_y2": 544.97034, "r_x3": 308.86203, "r_y3": 544.97034, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 589.40637, "r_x1": 323.9046, "r_y1": 589.40637, "r_x2": 323.9046, "r_y2": 579.55432, "r_x3": 308.86203, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93301, "r_y0": 589.40637, "r_x1": 397.44281, "r_y1": 589.40637, "r_x2": 397.44281, "r_y2": 579.55432, "r_x3": 333.93301, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 612.3558800000001, "r_x1": 545.11493, "r_y1": 612.3558800000001, "r_x2": 545.11493, "r_y2": 603.44933, "r_x3": 320.81702, "r_y3": 603.44933, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 624.31088, "r_x1": 545.11511, "r_y1": 624.31088, "r_x2": 545.11511, "r_y2": 615.40433, "r_x3": 308.86203, "r_y3": 615.40433, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 636.26588, "r_x1": 545.11517, "r_y1": 636.26588, "r_x2": 545.11517, "r_y2": 627.35933, "r_x3": 308.86203, "r_y3": 627.35933, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 648.22089, "r_x1": 545.11511, "r_y1": 648.22089, "r_x2": 545.11511, "r_y2": 639.31433, "r_x3": 308.86203, "r_y3": 639.31433, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 660.17688, "r_x1": 545.11517, "r_y1": 660.17688, "r_x2": 545.11517, "r_y2": 651.27032, "r_x3": 308.86203, "r_y3": 651.27032, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 672.13189, "r_x1": 350.70493, "r_y1": 672.13189, "r_x2": 350.70493, "r_y2": 663.22533, "r_x3": 308.86203, "r_y3": 663.22533, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 689.24189, "r_x1": 545.11505, "r_y1": 689.24189, "r_x2": 545.11505, "r_y2": 680.33533, "r_x3": 320.81702, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 701.196892, "r_x1": 396.21411, "r_y1": 701.196892, "r_x2": 396.21411, "r_y2": 692.290329, "r_x3": 308.86203, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.40585, "r_y0": 701.196892, "r_x1": 545.11523, "r_y1": 701.196892, "r_x2": 545.11523, "r_y2": 692.290329, "r_x3": 406.40585, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 713.152893, "r_x1": 495.93982, "r_y1": 713.152893, "r_x2": 495.93982, "r_y2": 704.246323, "r_x3": 308.86203, "r_y3": 704.246323, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.03989, "r_x1": 300.10233, "r_y1": 743.03989, "r_x2": 300.10233, "r_y2": 734.133327, "r_x3": 295.12103, "r_y3": 734.133327, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36514, "b": 155.84600999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9868090152740479, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36514, "r_y1": 84.11492999999996, "r_x2": 286.36514, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 286.36508, "r_y1": 96.06994999999995, "r_x2": 286.36508, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 286.36508, "r_y1": 108.02495999999985, "r_x2": 286.36508, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 119.97997999999984, "r_x1": 286.36508, "r_y1": 119.97997999999984, "r_x2": 286.36508, "r_y2": 111.07343000000003, "r_x3": 50.112, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.93499999999995, "r_x1": 286.36508, "r_y1": 131.93499999999995, "r_x2": 286.36508, "r_y2": 123.02844000000005, "r_x3": 50.112, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.89099, "r_x1": 286.36514, "r_y1": 143.89099, "r_x2": 286.36514, "r_y2": 134.98443999999995, "r_x3": 50.112, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.84600999999998, "r_x1": 175.16254, "r_y1": 155.84600999999998, "r_x2": 175.16254, "r_y2": 146.93944999999997, "r_x3": 50.112, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 50.112, "t": 159.62445000000002, "r": 286.36511, "b": 240.26306, "coord_origin": "TOPLEFT" }, "confidence": 0.9860327839851379, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 168.53101000000004, "r_x1": 286.36496, "r_y1": 168.53101000000004, "r_x2": 286.36496, "r_y2": 159.62445000000002, "r_x3": 62.067001, "r_y3": 159.62445000000002, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.48699999999997, "r_x1": 286.36511, "r_y1": 180.48699999999997, "r_x2": 286.36511, "r_y2": 171.58043999999995, "r_x3": 50.112, "r_y3": 171.58043999999995, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.44201999999996, "r_x1": 286.36511, "r_y1": 192.44201999999996, "r_x2": 286.36511, "r_y2": 183.53545999999994, "r_x3": 50.112, "r_y3": 183.53545999999994, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.39702999999997, "r_x1": 286.36511, "r_y1": 204.39702999999997, "r_x2": 286.36511, "r_y2": 195.49048000000005, "r_x3": 50.112, "r_y3": 195.49048000000005, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.35204999999996, "r_x1": 286.36511, "r_y1": 216.35204999999996, "r_x2": 286.36511, "r_y2": 207.44550000000004, "r_x3": 50.112, "r_y3": 207.44550000000004, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.30706999999995, "r_x1": 286.36511, "r_y1": 228.30706999999995, "r_x2": 286.36511, "r_y2": 219.40051000000005, "r_x3": 50.112, "r_y3": 219.40051000000005, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 240.26306, "r_x1": 181.54855, "r_y1": 240.26306, "r_x2": 181.54855, "r_y2": 231.35650999999996, "r_x3": 50.112, "r_y3": 231.35650999999996, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 243.92193999999995, "r": 286.36572, "b": 444.2309, "coord_origin": "TOPLEFT" }, "confidence": 0.9873637557029724, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.87829999999997, "r_x1": 129.21492, "r_y1": 252.87829999999997, "r_x2": 129.21492, "r_y2": 243.92193999999995, "r_x3": 62.067001, "r_y3": 243.92193999999995, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.451, "r_y0": 252.94806000000005, "r_x1": 286.36078, "r_y1": 252.94806000000005, "r_x2": 286.36078, "r_y2": 244.04150000000004, "r_x3": 134.451, "r_y3": 244.04150000000004, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 264.90308000000005, "r_x1": 286.36511, "r_y1": 264.90308000000005, "r_x2": 286.36511, "r_y2": 255.99652000000003, "r_x3": 50.112007, "r_y3": 255.99652000000003, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 276.63989000000004, "r_x1": 56.84528, "r_y1": 276.63989000000004, "r_x2": 56.84528, "r_y2": 267.79309, "r_x3": 50.112007, "r_y3": 267.79309, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.343006, "r_y0": 276.85907, "r_x1": 135.39996, "r_y1": 276.85907, "r_x2": 135.39996, "r_y2": 267.95250999999996, "r_x3": 57.343006, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.735, "r_y0": 276.62994000000003, "r_x1": 211.07965, "r_y1": 276.62994000000003, "r_x2": 211.07965, "r_y2": 268.04218000000003, "r_x3": 137.735, "r_y3": 268.04218000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.63699, "r_y0": 276.85907, "r_x1": 286.36395, "r_y1": 276.85907, "r_x2": 286.36395, "r_y2": 267.95250999999996, "r_x3": 213.63699, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.81406, "r_x1": 158.82388, "r_y1": 288.81406, "r_x2": 158.82388, "r_y2": 279.90747, "r_x3": 50.112, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.31799, "r_y0": 288.58493, "r_x1": 238.79712, "r_y1": 288.58493, "r_x2": 238.79712, "r_y2": 279.99712999999997, "r_x3": 161.31799, "r_y3": 279.99712999999997, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.521, "r_y0": 288.81406, "r_x1": 286.36264, "r_y1": 288.81406, "r_x2": 286.36264, "r_y2": 279.90747, "r_x3": 241.521, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.76904, "r_x1": 211.3766, "r_y1": 300.76904, "r_x2": 211.3766, "r_y2": 291.86249, "r_x3": 50.112, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.271, "r_y0": 300.54987, "r_x1": 229.19780000000003, "r_y1": 300.54987, "r_x2": 229.19780000000003, "r_y2": 291.70309, "r_x3": 214.271, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.696, "r_y0": 300.76904, "r_x1": 232.18665000000001, "r_y1": 300.76904, "r_x2": 232.18665000000001, "r_y2": 291.86249, "r_x3": 229.696, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49001, "r_y0": 300.54987, "r_x1": 251.41681000000003, "r_y1": 300.54987, "r_x2": 251.41681000000003, "r_y2": 291.70309, "r_x3": 236.49001, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81099999999998, "r_y0": 300.76904, "r_x1": 286.36255, "r_y1": 300.76904, "r_x2": 286.36255, "r_y2": 291.86249, "r_x3": 254.81099999999998, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.72403, "r_x1": 137.45412, "r_y1": 312.72403, "r_x2": 137.45412, "r_y2": 303.81747, "r_x3": 50.112, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.298, "r_y0": 312.50485, "r_x1": 148.24258, "r_y1": 312.50485, "r_x2": 148.24258, "r_y2": 303.65808, "r_x3": 141.298, "r_y3": 303.65808, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.58601, "r_y0": 312.72403, "r_x1": 286.36377, "r_y1": 312.72403, "r_x2": 286.36377, "r_y2": 303.81747, "r_x3": 152.58601, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 324.67902, "r_x1": 89.683464, "r_y1": 324.67902, "r_x2": 89.683464, "r_y2": 315.77245999999997, "r_x3": 50.112015, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.68602, "r_y0": 324.45984, "r_x1": 104.12046, "r_y1": 324.45984, "r_x2": 104.12046, "r_y2": 315.61307, "r_x3": 89.68602, "r_y3": 315.61307, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.61802, "r_y0": 324.67902, "r_x1": 286.36572, "r_y1": 324.67902, "r_x2": 286.36572, "r_y2": 315.77245999999997, "r_x3": 104.61802, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 336.6350100000001, "r_x1": 286.36511, "r_y1": 336.6350100000001, "r_x2": 286.36511, "r_y2": 327.72845, "r_x3": 50.112019, "r_y3": 327.72845, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 348.59, "r_x1": 286.36508, "r_y1": 348.59, "r_x2": 286.36508, "r_y2": 339.68344, "r_x3": 50.112019, "r_y3": 339.68344, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 360.54498, "r_x1": 286.36511, "r_y1": 360.54498, "r_x2": 286.36511, "r_y2": 351.63843, "r_x3": 50.112019, "r_y3": 351.63843, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 372.49996999999996, "r_x1": 286.36508, "r_y1": 372.49996999999996, "r_x2": 286.36508, "r_y2": 363.59341, "r_x3": 50.112019, "r_y3": 363.59341, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 384.45496, "r_x1": 286.36511, "r_y1": 384.45496, "r_x2": 286.36511, "r_y2": 375.5484, "r_x3": 50.112019, "r_y3": 375.5484, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 396.40994, "r_x1": 286.36514, "r_y1": 396.40994, "r_x2": 286.36514, "r_y2": 387.50339, "r_x3": 50.112019, "r_y3": 387.50339, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 408.36594, "r_x1": 88.68721, "r_y1": 408.36594, "r_x2": 88.68721, "r_y2": 399.45938, "r_x3": 50.112019, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.646019, "r_y0": 408.13681, "r_x1": 170.0517, "r_y1": 408.13681, "r_x2": 170.0517, "r_y2": 399.54904, "r_x3": 91.646019, "r_y3": 399.54904, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05103, "r_y0": 408.36594, "r_x1": 286.36438, "r_y1": 408.36594, "r_x2": 286.36438, "r_y2": 399.45938, "r_x3": 170.05103, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 420.32092, "r_x1": 181.96703, "r_y1": 420.32092, "r_x2": 181.96703, "r_y2": 411.41437, "r_x3": 50.112022, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09029, "r_y0": 420.32092, "r_x1": 197.74918, "r_y1": 420.32092, "r_x2": 197.74918, "r_y2": 411.41437, "r_x3": 189.09029, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.34789, "r_y0": 420.32092, "r_x1": 286.36511, "r_y1": 420.32092, "r_x2": 286.36511, "r_y2": 411.41437, "r_x3": 200.34789, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 432.27591, "r_x1": 286.36511, "r_y1": 432.27591, "r_x2": 286.36511, "r_y2": 423.36934999999994, "r_x3": 50.112022, "r_y3": 423.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 444.2309, "r_x1": 158.2959, "r_y1": 444.2309, "r_x2": 158.2959, "r_y2": 435.32434, "r_x3": 50.112022, "r_y3": 435.32434, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 50.112022, "t": 448.01035, "r": 286.36499, "b": 468.87189, "coord_origin": "TOPLEFT" }, "confidence": 0.9724196195602417, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067024, "r_y0": 456.9169, "r_x1": 286.36499, "r_y1": 456.9169, "r_x2": 286.36499, "r_y2": 448.01035, "r_x3": 62.067024, "r_y3": 448.01035, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 468.87189, "r_x1": 91.377113, "r_y1": 468.87189, "r_x2": 91.377113, "r_y2": 459.96533, "r_x3": 50.112022, "r_y3": 459.96533, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "formula", "bbox": { "l": 124.33002, "t": 493.28094, "r": 286.36243, "b": 517.07172, "coord_origin": "TOPLEFT" }, "confidence": 0.9423348307609558, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.71502, "r_y0": 502.12772, "r_x1": 140.64182, "r_y1": 502.12772, "r_x2": 140.64182, "r_y2": 493.28094, "r_x3": 125.71502, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.90701, "r_y0": 502.12772, "r_x1": 151.65593, "r_y1": 502.12772, "r_x2": 151.65593, "r_y2": 493.28094, "r_x3": 143.90701, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42302, "r_y0": 502.12772, "r_x1": 186.62846, "r_y1": 502.12772, "r_x2": 186.62846, "r_y2": 493.28094, "r_x3": 154.42302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34003, "r_y0": 502.12772, "r_x1": 197.08894, "r_y1": 502.12772, "r_x2": 197.08894, "r_y2": 493.28094, "r_x3": 189.34003, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.30302, "r_y0": 502.12772, "r_x1": 211.64659, "r_y1": 502.12772, "r_x2": 211.64659, "r_y2": 493.28094, "r_x3": 199.30302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33002, "r_y0": 517.07172, "r_x1": 127.30286, "r_y1": 517.07172, "r_x2": 127.30286, "r_y2": 508.22495, "r_x3": 124.33002, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.26602, "r_y0": 517.07172, "r_x1": 138.01494, "r_y1": 517.07172, "r_x2": 138.01494, "r_y2": 508.22495, "r_x3": 130.26602, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78203, "r_y0": 517.07172, "r_x1": 153.32629, "r_y1": 517.07172, "r_x2": 153.32629, "r_y2": 508.22495, "r_x3": 140.78203, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.03903, "r_y0": 517.07172, "r_x1": 174.85541, "r_y1": 517.07172, "r_x2": 174.85541, "r_y2": 508.22495, "r_x3": 156.03903, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07103, "r_y0": 517.07172, "r_x1": 184.81995, "r_y1": 517.07172, "r_x2": 184.81995, "r_y2": 507.66702, "r_x3": 177.07103, "r_y3": 507.66702, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03304, "r_y0": 517.07172, "r_x1": 192.84422, "r_y1": 517.07172, "r_x2": 192.84422, "r_y2": 508.22495, "r_x3": 187.03304, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.84503, "r_y0": 517.07172, "r_x1": 196.71948, "r_y1": 517.07172, "r_x2": 196.71948, "r_y2": 508.22495, "r_x3": 192.84503, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.71902, "r_y0": 517.07172, "r_x1": 211.64583, "r_y1": 517.07172, "r_x2": 211.64583, "r_y2": 508.22495, "r_x3": 196.71902, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74603, "r_y0": 509.91788, "r_x1": 286.36243, "r_y1": 509.91788, "r_x2": 286.36243, "r_y2": 501.01132, "r_x3": 274.74603, "r_y3": 501.01132, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 50.11203, "t": 530.5920100000001, "r": 281.59692, "b": 540.21588, "coord_origin": "TOPLEFT" }, "confidence": 0.9363929629325867, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 540.21588, "r_x1": 74.450661, "r_y1": 540.21588, "r_x2": 74.450661, "r_y2": 531.30933, "r_x3": 50.11203, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.941032, "r_y0": 539.9967, "r_x1": 82.75222, "r_y1": 539.9967, "r_x2": 82.75222, "r_y2": 531.14993, "r_x3": 76.941032, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.520035, "r_y0": 539.9967, "r_x1": 92.162102, "r_y1": 539.9967, "r_x2": 92.162102, "r_y2": 530.5920100000001, "r_x3": 85.520035, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.653038, "r_y0": 540.21588, "r_x1": 135.59932, "r_y1": 540.21588, "r_x2": 135.59932, "r_y2": 531.30933, "r_x3": 94.653038, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09004, "r_y0": 539.9967, "r_x1": 172.63162, "r_y1": 539.9967, "r_x2": 172.63162, "r_y2": 531.14993, "r_x3": 138.09004, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.89705, "r_y0": 539.9967, "r_x1": 192.50104, "r_y1": 539.9967, "r_x2": 192.50104, "r_y2": 530.5920100000001, "r_x3": 175.89705, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99205, "r_y0": 540.21588, "r_x1": 281.59692, "r_y1": 540.21588, "r_x2": 281.59692, "r_y2": 531.30933, "r_x3": 194.99205, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "section_header", "bbox": { "l": 50.112045, "t": 555.91689, "r": 171.98335, "b": 566.66461, "coord_origin": "TOPLEFT" }, "confidence": 0.9554555416107178, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 566.66461, "r_x1": 57.92831799999999, "r_y1": 566.66461, "r_x2": 57.92831799999999, "r_y2": 555.91689, "r_x3": 50.112045, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.350014, "r_y0": 566.66461, "r_x1": 171.98335, "r_y1": 566.66461, "r_x2": 171.98335, "r_y2": 555.91689, "r_x3": 68.350014, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 50.112045, "t": 576.26433, "r": 179.17502, "b": 586.1163799999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9538503289222717, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 586.1163799999999, "r_x1": 64.693237, "r_y1": 586.1163799999999, "r_x2": 64.693237, "r_y2": 576.26433, "r_x3": 50.112045, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.414032, "r_y0": 586.1163799999999, "r_x1": 179.17502, "r_y1": 586.1163799999999, "r_x2": 179.17502, "r_y2": 576.26433, "r_x3": 74.414032, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 50.112045, "t": 595.73433, "r": 286.36517, "b": 640.50688, "coord_origin": "TOPLEFT" }, "confidence": 0.9856163263320923, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067047, "r_y0": 604.64088, "r_x1": 202.97806, "r_y1": 604.64088, "r_x2": 202.97806, "r_y2": 595.73433, "r_x3": 62.067047, "r_y3": 595.73433, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38405, "r_y0": 604.41174, "r_x1": 286.36008, "r_y1": 604.41174, "r_x2": 286.36008, "r_y2": 595.82399, "r_x3": 205.38405, "r_y3": 595.82399, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 616.3667399999999, "r_x1": 70.037247, "r_y1": 616.3667399999999, "r_x2": 70.037247, "r_y2": 607.77899, "r_x3": 50.112045, "r_y3": 607.77899, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037048, "r_y0": 616.59589, "r_x1": 286.36496, "r_y1": 616.59589, "r_x2": 286.36496, "r_y2": 607.68933, "r_x3": 70.037048, "r_y3": 607.68933, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 628.55089, "r_x1": 286.36517, "r_y1": 628.55089, "r_x2": 286.36517, "r_y2": 619.64433, "r_x3": 50.112049, "r_y3": 619.64433, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 640.50688, "r_x1": 207.03294, "r_y1": 640.50688, "r_x2": 207.03294, "r_y2": 631.60033, "r_x3": 50.112049, "r_y3": 631.60033, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "formula", "bbox": { "l": 91.661049, "t": 653.828, "r": 286.36246, "b": 678.39588, "coord_origin": "TOPLEFT" }, "confidence": 0.844183623790741, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.661049, "r_y0": 663.45187, "r_x1": 186.01683, "r_y1": 663.45187, "r_x2": 186.01683, "r_y2": 654.54532, "r_x3": 91.661049, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.50705, "r_y0": 663.2327, "r_x1": 196.25597, "r_y1": 663.2327, "r_x2": 196.25597, "r_y2": 653.828, "r_x3": 188.50705, "r_y3": 653.828, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.74605, "r_y0": 663.45187, "r_x1": 244.81310999999997, "r_y1": 663.45187, "r_x2": 244.81310999999997, "r_y2": 654.54532, "r_x3": 198.74605, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.01604, "r_y0": 678.39588, "r_x1": 186.24606, "r_y1": 678.39588, "r_x2": 186.24606, "r_y2": 669.48932, "r_x3": 101.01604, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.73605, "r_y0": 678.1767, "r_x1": 196.48497, "r_y1": 678.1767, "r_x2": 196.48497, "r_y2": 668.77201, "r_x3": 188.73605, "r_y3": 668.77201, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.97505, "r_y0": 678.39588, "r_x1": 244.81296999999998, "r_y1": 678.39588, "r_x2": 244.81296999999998, "r_y2": 669.48932, "r_x3": 198.97505, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74606, "r_y0": 671.02388, "r_x1": 286.36246, "r_y1": 671.02388, "r_x2": 286.36246, "r_y2": 662.11731, "r_x3": 274.74606, "r_y3": 662.11731, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "text", "bbox": { "l": 50.112061, "t": 692.290314, "r": 286.36514, "b": 713.151878, "coord_origin": "TOPLEFT" }, "confidence": 0.9724979996681213, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 701.196877, "r_x1": 286.36514, "r_y1": 701.196877, "r_x2": 286.36514, "r_y2": 692.290314, "r_x3": 50.112061, "r_y3": 692.290314, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 713.151878, "r_x1": 286.36514, "r_y1": 713.151878, "r_x2": 286.36514, "r_y2": 704.245316, "r_x3": 50.112061, "r_y3": 704.245316, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 308.86206, "t": 75.20830999999998, "r": 545.11523, "b": 108.0249, "coord_origin": "TOPLEFT" }, "confidence": 0.9799237847328186, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 84.11487, "r_x1": 545.11523, "r_y1": 84.11487, "r_x2": 545.11523, "r_y2": 75.20830999999998, "r_x3": 308.86206, "r_y3": 75.20830999999998, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 96.06988999999999, "r_x1": 339.98523, "r_y1": 96.06988999999999, "r_x2": 339.98523, "r_y2": 87.16332999999997, "r_x3": 308.86206, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.88931, "r_y0": 96.06988999999999, "r_x1": 545.11523, "r_y1": 96.06988999999999, "r_x2": 545.11523, "r_y2": 87.16332999999997, "r_x3": 346.88931, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 108.0249, "r_x1": 492.96097, "r_y1": 108.0249, "r_x2": 492.96097, "r_y2": 99.11835000000008, "r_x3": 308.86206, "r_y3": 99.11835000000008, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.86206, "t": 116.22937000000002, "r": 545.1153, "b": 328.37405, "coord_origin": "TOPLEFT" }, "confidence": 0.9880930781364441, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 125.13593000000003, "r_x1": 545.11499, "r_y1": 125.13593000000003, "r_x2": 545.11499, "r_y2": 116.22937000000002, "r_x3": 320.81705, "r_y3": 116.22937000000002, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 137.09094000000005, "r_x1": 545.11517, "r_y1": 137.09094000000005, "r_x2": 545.11517, "r_y2": 128.18439, "r_x3": 308.86206, "r_y3": 128.18439, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 149.04596000000004, "r_x1": 545.11505, "r_y1": 149.04596000000004, "r_x2": 545.11505, "r_y2": 140.13940000000002, "r_x3": 308.86206, "r_y3": 140.13940000000002, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 161.00098000000003, "r_x1": 545.11511, "r_y1": 161.00098000000003, "r_x2": 545.11511, "r_y2": 152.09442, "r_x3": 308.86206, "r_y3": 152.09442, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 172.95599000000004, "r_x1": 545.11517, "r_y1": 172.95599000000004, "r_x2": 545.11517, "r_y2": 164.04944, "r_x3": 308.86206, "r_y3": 164.04944, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 184.91198999999995, "r_x1": 467.21756000000005, "r_y1": 184.91198999999995, "r_x2": 467.21756000000005, "r_y2": 176.00543000000005, "r_x3": 308.86206, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.43671, "r_y0": 184.91198999999995, "r_x1": 545.11511, "r_y1": 184.91198999999995, "r_x2": 545.11511, "r_y2": 176.00543000000005, "r_x3": 475.43671, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 196.86699999999996, "r_x1": 545.11511, "r_y1": 196.86699999999996, "r_x2": 545.11511, "r_y2": 187.96045000000004, "r_x3": 308.86206, "r_y3": 187.96045000000004, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 208.82201999999995, "r_x1": 545.11511, "r_y1": 208.82201999999995, "r_x2": 545.11511, "r_y2": 199.91547000000003, "r_x3": 308.86206, "r_y3": 199.91547000000003, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 220.77704000000006, "r_x1": 545.11517, "r_y1": 220.77704000000006, "r_x2": 545.11517, "r_y2": 211.87048000000004, "r_x3": 308.86206, "r_y3": 211.87048000000004, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 232.73206000000005, "r_x1": 545.11511, "r_y1": 232.73206000000005, "r_x2": 545.11511, "r_y2": 223.82550000000003, "r_x3": 308.86206, "r_y3": 223.82550000000003, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 244.68706999999995, "r_x1": 545.11511, "r_y1": 244.68706999999995, "r_x2": 545.11511, "r_y2": 235.78052000000002, "r_x3": 308.86206, "r_y3": 235.78052000000002, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 256.64306999999997, "r_x1": 545.11523, "r_y1": 256.64306999999997, "r_x2": 545.11523, "r_y2": 247.73650999999995, "r_x3": 308.86206, "r_y3": 247.73650999999995, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 268.59808, "r_x1": 342.3364, "r_y1": 268.59808, "r_x2": 342.3364, "r_y2": 259.69152999999994, "r_x3": 308.86206, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95157, "r_y0": 268.59808, "r_x1": 545.11517, "r_y1": 268.59808, "r_x2": 545.11517, "r_y2": 259.69152999999994, "r_x3": 348.95157, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 280.55310000000003, "r_x1": 545.11517, "r_y1": 280.55310000000003, "r_x2": 545.11517, "r_y2": 271.64655000000005, "r_x3": 308.86206, "r_y3": 271.64655000000005, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 292.50809, "r_x1": 545.1153, "r_y1": 292.50809, "r_x2": 545.1153, "r_y2": 283.6015300000001, "r_x3": 308.86206, "r_y3": 283.6015300000001, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 304.46307, "r_x1": 545.11511, "r_y1": 304.46307, "r_x2": 545.11511, "r_y2": 295.55652, "r_x3": 308.86206, "r_y3": 295.55652, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 316.41806, "r_x1": 545.11511, "r_y1": 316.41806, "r_x2": 545.11511, "r_y2": 307.51151, "r_x3": 308.86206, "r_y3": 307.51151, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 328.37405, "r_x1": 532.48267, "r_y1": 328.37405, "r_x2": 532.48267, "r_y2": 319.4674999999999, "r_x3": 308.86206, "r_y3": 319.4674999999999, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.86203, "t": 336.57751, "r": 545.11517, "b": 429.16998, "coord_origin": "TOPLEFT" }, "confidence": 0.9877589344978333, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 345.48407000000003, "r_x1": 545.11499, "r_y1": 345.48407000000003, "r_x2": 545.11499, "r_y2": 336.57751, "r_x3": 320.81705, "r_y3": 336.57751, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 357.43906, "r_x1": 403.7359, "r_y1": 357.43906, "r_x2": 403.7359, "r_y2": 348.5325000000001, "r_x3": 308.86206, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.07605, "r_y0": 357.20993, "r_x1": 503.54016, "r_y1": 357.20993, "r_x2": 503.54016, "r_y2": 348.62216, "r_x3": 406.07605, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.53906, "r_y0": 357.43906, "r_x1": 506.02972, "r_y1": 357.43906, "r_x2": 506.02972, "r_y2": 348.5325000000001, "r_x3": 503.53906, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.40004999999996, "r_y0": 357.20993, "r_x1": 545.11224, "r_y1": 357.20993, "r_x2": 545.11224, "r_y2": 348.62216, "r_x3": 508.40004999999996, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 369.16492000000005, "r_x1": 343.1633, "r_y1": 369.16492000000005, "r_x2": 343.1633, "r_y2": 360.57715, "r_x3": 308.86206, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16306, "r_y0": 369.39404, "r_x1": 362.2016, "r_y1": 369.39404, "r_x2": 362.2016, "r_y2": 360.48749, "r_x3": 343.16306, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.28604, "r_y0": 369.16492000000005, "r_x1": 440.93829, "r_y1": 369.16492000000005, "r_x2": 440.93829, "r_y2": 360.57715, "r_x3": 364.28604, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.93903, "r_y0": 369.39404, "r_x1": 545.10797, "r_y1": 369.39404, "r_x2": 545.10797, "r_y2": 360.48749, "r_x3": 440.93903, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 381.34903, "r_x1": 545.11511, "r_y1": 381.34903, "r_x2": 545.11511, "r_y2": 372.44247, "r_x3": 308.86203, "r_y3": 372.44247, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 393.30502, "r_x1": 545.11517, "r_y1": 393.30502, "r_x2": 545.11517, "r_y2": 384.3984699999999, "r_x3": 308.86203, "r_y3": 384.3984699999999, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 405.04083, "r_x1": 314.67322, "r_y1": 405.04083, "r_x2": 314.67322, "r_y2": 396.19406000000004, "r_x3": 308.86203, "r_y3": 396.19406000000004, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.65802, "r_y0": 405.2600100000001, "r_x1": 360.39139, "r_y1": 405.2600100000001, "r_x2": 360.39139, "r_y2": 396.35345, "r_x3": 318.65802, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96295, "r_y0": 405.2600100000001, "r_x1": 545.10803, "r_y1": 405.2600100000001, "r_x2": 545.10803, "r_y2": 396.35345, "r_x3": 367.96295, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 417.215, "r_x1": 545.11511, "r_y1": 417.215, "r_x2": 545.11511, "r_y2": 408.30844, "r_x3": 308.86203, "r_y3": 408.30844, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 429.16998, "r_x1": 360.9664, "r_y1": 429.16998, "r_x2": 360.9664, "r_y2": 420.26343, "r_x3": 308.86203, "r_y3": 420.26343, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86203, "t": 437.37441999999993, "r": 545.11523, "b": 553.87689, "coord_origin": "TOPLEFT" }, "confidence": 0.9884491562843323, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 446.28098, "r_x1": 545.11499, "r_y1": 446.28098, "r_x2": 545.11499, "r_y2": 437.37441999999993, "r_x3": 320.81702, "r_y3": 437.37441999999993, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 458.23596, "r_x1": 384.62759, "r_y1": 458.23596, "r_x2": 384.62759, "r_y2": 449.32941, "r_x3": 308.86203, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37228, "r_y0": 458.23596, "r_x1": 545.11511, "r_y1": 458.23596, "r_x2": 545.11511, "r_y2": 449.32941, "r_x3": 391.37228, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 470.19095, "r_x1": 494.00693000000007, "r_y1": 470.19095, "r_x2": 494.00693000000007, "r_y2": 461.28439, "r_x3": 308.86203, "r_y3": 461.28439, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.07803, "r_y0": 469.96182, "r_x1": 545.11145, "r_y1": 469.96182, "r_x2": 545.11145, "r_y2": 461.37405, "r_x3": 498.07803, "r_y3": 461.37405, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 481.91681, "r_x1": 364.44336, "r_y1": 481.91681, "r_x2": 364.44336, "r_y2": 473.32904, "r_x3": 308.86203, "r_y3": 473.32904, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06104, "r_y0": 482.14594, "r_x1": 545.11267, "r_y1": 482.14594, "r_x2": 545.11267, "r_y2": 473.23938, "r_x3": 367.06104, "r_y3": 473.23938, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 494.10092, "r_x1": 545.11511, "r_y1": 494.10092, "r_x2": 545.11511, "r_y2": 485.19437, "r_x3": 308.86203, "r_y3": 485.19437, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 506.05591, "r_x1": 545.11523, "r_y1": 506.05591, "r_x2": 545.11523, "r_y2": 497.14935, "r_x3": 308.86203, "r_y3": 497.14935, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 518.0119, "r_x1": 545.11511, "r_y1": 518.0119, "r_x2": 545.11511, "r_y2": 509.10535, "r_x3": 308.86203, "r_y3": 509.10535, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 529.9668899999999, "r_x1": 545.11517, "r_y1": 529.9668899999999, "r_x2": 545.11517, "r_y2": 521.06033, "r_x3": 308.86203, "r_y3": 521.06033, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 541.9218900000001, "r_x1": 545.11517, "r_y1": 541.9218900000001, "r_x2": 545.11517, "r_y2": 533.01532, "r_x3": 308.86203, "r_y3": 533.01532, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 553.87689, "r_x1": 377.21548, "r_y1": 553.87689, "r_x2": 377.21548, "r_y2": 544.97034, "r_x3": 308.86203, "r_y3": 544.97034, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "section_header", "bbox": { "l": 308.86203, "t": 579.55432, "r": 397.44281, "b": 589.40637, "coord_origin": "TOPLEFT" }, "confidence": 0.9450808763504028, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 589.40637, "r_x1": 323.9046, "r_y1": 589.40637, "r_x2": 323.9046, "r_y2": 579.55432, "r_x3": 308.86203, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93301, "r_y0": 589.40637, "r_x1": 397.44281, "r_y1": 589.40637, "r_x2": 397.44281, "r_y2": 579.55432, "r_x3": 333.93301, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.86203, "t": 603.44933, "r": 545.11517, "b": 672.13189, "coord_origin": "TOPLEFT" }, "confidence": 0.9880595803260803, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 612.3558800000001, "r_x1": 545.11493, "r_y1": 612.3558800000001, "r_x2": 545.11493, "r_y2": 603.44933, "r_x3": 320.81702, "r_y3": 603.44933, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 624.31088, "r_x1": 545.11511, "r_y1": 624.31088, "r_x2": 545.11511, "r_y2": 615.40433, "r_x3": 308.86203, "r_y3": 615.40433, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 636.26588, "r_x1": 545.11517, "r_y1": 636.26588, "r_x2": 545.11517, "r_y2": 627.35933, "r_x3": 308.86203, "r_y3": 627.35933, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 648.22089, "r_x1": 545.11511, "r_y1": 648.22089, "r_x2": 545.11511, "r_y2": 639.31433, "r_x3": 308.86203, "r_y3": 639.31433, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 660.17688, "r_x1": 545.11517, "r_y1": 660.17688, "r_x2": 545.11517, "r_y2": 651.27032, "r_x3": 308.86203, "r_y3": 651.27032, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 672.13189, "r_x1": 350.70493, "r_y1": 672.13189, "r_x2": 350.70493, "r_y2": 663.22533, "r_x3": 308.86203, "r_y3": 663.22533, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 308.86203, "t": 680.33533, "r": 545.11523, "b": 713.152893, "coord_origin": "TOPLEFT" }, "confidence": 0.9830910563468933, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 689.24189, "r_x1": 545.11505, "r_y1": 689.24189, "r_x2": 545.11505, "r_y2": 680.33533, "r_x3": 320.81702, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 701.196892, "r_x1": 396.21411, "r_y1": 701.196892, "r_x2": 396.21411, "r_y2": 692.290329, "r_x3": 308.86203, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.40585, "r_y0": 701.196892, "r_x1": 545.11523, "r_y1": 701.196892, "r_x2": 545.11523, "r_y2": 692.290329, "r_x3": 406.40585, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 713.152893, "r_x1": 495.93982, "r_y1": 713.152893, "r_x2": 495.93982, "r_y2": 704.246323, "r_x3": 308.86203, "r_y3": 704.246323, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "page_footer", "bbox": { "l": 295.12103, "t": 734.133327, "r": 300.10233, "b": 743.03989, "coord_origin": "TOPLEFT" }, "confidence": 0.8820409178733826, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.03989, "r_x1": 300.10233, "r_y1": 743.03989, "r_x2": 300.10233, "r_y2": 734.133327, "r_x3": 295.12103, "r_y3": 734.133327, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36514, "b": 155.84600999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9868090152740479, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36514, "r_y1": 84.11492999999996, "r_x2": 286.36514, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 286.36508, "r_y1": 96.06994999999995, "r_x2": 286.36508, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 286.36508, "r_y1": 108.02495999999985, "r_x2": 286.36508, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 119.97997999999984, "r_x1": 286.36508, "r_y1": 119.97997999999984, "r_x2": 286.36508, "r_y2": 111.07343000000003, "r_x3": 50.112, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.93499999999995, "r_x1": 286.36508, "r_y1": 131.93499999999995, "r_x2": 286.36508, "r_y2": 123.02844000000005, "r_x3": 50.112, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.89099, "r_x1": 286.36514, "r_y1": 143.89099, "r_x2": 286.36514, "r_y2": 134.98443999999995, "r_x3": 50.112, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.84600999999998, "r_x1": 175.16254, "r_y1": 155.84600999999998, "r_x2": 175.16254, "r_y2": 146.93944999999997, "r_x3": 50.112, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.112, "t": 159.62445000000002, "r": 286.36511, "b": 240.26306, "coord_origin": "TOPLEFT" }, "confidence": 0.9860327839851379, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 168.53101000000004, "r_x1": 286.36496, "r_y1": 168.53101000000004, "r_x2": 286.36496, "r_y2": 159.62445000000002, "r_x3": 62.067001, "r_y3": 159.62445000000002, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.48699999999997, "r_x1": 286.36511, "r_y1": 180.48699999999997, "r_x2": 286.36511, "r_y2": 171.58043999999995, "r_x3": 50.112, "r_y3": 171.58043999999995, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.44201999999996, "r_x1": 286.36511, "r_y1": 192.44201999999996, "r_x2": 286.36511, "r_y2": 183.53545999999994, "r_x3": 50.112, "r_y3": 183.53545999999994, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.39702999999997, "r_x1": 286.36511, "r_y1": 204.39702999999997, "r_x2": 286.36511, "r_y2": 195.49048000000005, "r_x3": 50.112, "r_y3": 195.49048000000005, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.35204999999996, "r_x1": 286.36511, "r_y1": 216.35204999999996, "r_x2": 286.36511, "r_y2": 207.44550000000004, "r_x3": 50.112, "r_y3": 207.44550000000004, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.30706999999995, "r_x1": 286.36511, "r_y1": 228.30706999999995, "r_x2": 286.36511, "r_y2": 219.40051000000005, "r_x3": 50.112, "r_y3": 219.40051000000005, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 240.26306, "r_x1": 181.54855, "r_y1": 240.26306, "r_x2": 181.54855, "r_y2": 231.35650999999996, "r_x3": 50.112, "r_y3": 231.35650999999996, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer." }, { "label": "text", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 243.92193999999995, "r": 286.36572, "b": 444.2309, "coord_origin": "TOPLEFT" }, "confidence": 0.9873637557029724, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.87829999999997, "r_x1": 129.21492, "r_y1": 252.87829999999997, "r_x2": 129.21492, "r_y2": 243.92193999999995, "r_x3": 62.067001, "r_y3": 243.92193999999995, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.451, "r_y0": 252.94806000000005, "r_x1": 286.36078, "r_y1": 252.94806000000005, "r_x2": 286.36078, "r_y2": 244.04150000000004, "r_x3": 134.451, "r_y3": 244.04150000000004, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 264.90308000000005, "r_x1": 286.36511, "r_y1": 264.90308000000005, "r_x2": 286.36511, "r_y2": 255.99652000000003, "r_x3": 50.112007, "r_y3": 255.99652000000003, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 276.63989000000004, "r_x1": 56.84528, "r_y1": 276.63989000000004, "r_x2": 56.84528, "r_y2": 267.79309, "r_x3": 50.112007, "r_y3": 267.79309, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.343006, "r_y0": 276.85907, "r_x1": 135.39996, "r_y1": 276.85907, "r_x2": 135.39996, "r_y2": 267.95250999999996, "r_x3": 57.343006, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.735, "r_y0": 276.62994000000003, "r_x1": 211.07965, "r_y1": 276.62994000000003, "r_x2": 211.07965, "r_y2": 268.04218000000003, "r_x3": 137.735, "r_y3": 268.04218000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.63699, "r_y0": 276.85907, "r_x1": 286.36395, "r_y1": 276.85907, "r_x2": 286.36395, "r_y2": 267.95250999999996, "r_x3": 213.63699, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.81406, "r_x1": 158.82388, "r_y1": 288.81406, "r_x2": 158.82388, "r_y2": 279.90747, "r_x3": 50.112, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.31799, "r_y0": 288.58493, "r_x1": 238.79712, "r_y1": 288.58493, "r_x2": 238.79712, "r_y2": 279.99712999999997, "r_x3": 161.31799, "r_y3": 279.99712999999997, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.521, "r_y0": 288.81406, "r_x1": 286.36264, "r_y1": 288.81406, "r_x2": 286.36264, "r_y2": 279.90747, "r_x3": 241.521, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.76904, "r_x1": 211.3766, "r_y1": 300.76904, "r_x2": 211.3766, "r_y2": 291.86249, "r_x3": 50.112, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.271, "r_y0": 300.54987, "r_x1": 229.19780000000003, "r_y1": 300.54987, "r_x2": 229.19780000000003, "r_y2": 291.70309, "r_x3": 214.271, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.696, "r_y0": 300.76904, "r_x1": 232.18665000000001, "r_y1": 300.76904, "r_x2": 232.18665000000001, "r_y2": 291.86249, "r_x3": 229.696, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49001, "r_y0": 300.54987, "r_x1": 251.41681000000003, "r_y1": 300.54987, "r_x2": 251.41681000000003, "r_y2": 291.70309, "r_x3": 236.49001, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81099999999998, "r_y0": 300.76904, "r_x1": 286.36255, "r_y1": 300.76904, "r_x2": 286.36255, "r_y2": 291.86249, "r_x3": 254.81099999999998, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.72403, "r_x1": 137.45412, "r_y1": 312.72403, "r_x2": 137.45412, "r_y2": 303.81747, "r_x3": 50.112, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.298, "r_y0": 312.50485, "r_x1": 148.24258, "r_y1": 312.50485, "r_x2": 148.24258, "r_y2": 303.65808, "r_x3": 141.298, "r_y3": 303.65808, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.58601, "r_y0": 312.72403, "r_x1": 286.36377, "r_y1": 312.72403, "r_x2": 286.36377, "r_y2": 303.81747, "r_x3": 152.58601, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 324.67902, "r_x1": 89.683464, "r_y1": 324.67902, "r_x2": 89.683464, "r_y2": 315.77245999999997, "r_x3": 50.112015, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.68602, "r_y0": 324.45984, "r_x1": 104.12046, "r_y1": 324.45984, "r_x2": 104.12046, "r_y2": 315.61307, "r_x3": 89.68602, "r_y3": 315.61307, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.61802, "r_y0": 324.67902, "r_x1": 286.36572, "r_y1": 324.67902, "r_x2": 286.36572, "r_y2": 315.77245999999997, "r_x3": 104.61802, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 336.6350100000001, "r_x1": 286.36511, "r_y1": 336.6350100000001, "r_x2": 286.36511, "r_y2": 327.72845, "r_x3": 50.112019, "r_y3": 327.72845, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 348.59, "r_x1": 286.36508, "r_y1": 348.59, "r_x2": 286.36508, "r_y2": 339.68344, "r_x3": 50.112019, "r_y3": 339.68344, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 360.54498, "r_x1": 286.36511, "r_y1": 360.54498, "r_x2": 286.36511, "r_y2": 351.63843, "r_x3": 50.112019, "r_y3": 351.63843, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 372.49996999999996, "r_x1": 286.36508, "r_y1": 372.49996999999996, "r_x2": 286.36508, "r_y2": 363.59341, "r_x3": 50.112019, "r_y3": 363.59341, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 384.45496, "r_x1": 286.36511, "r_y1": 384.45496, "r_x2": 286.36511, "r_y2": 375.5484, "r_x3": 50.112019, "r_y3": 375.5484, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 396.40994, "r_x1": 286.36514, "r_y1": 396.40994, "r_x2": 286.36514, "r_y2": 387.50339, "r_x3": 50.112019, "r_y3": 387.50339, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 408.36594, "r_x1": 88.68721, "r_y1": 408.36594, "r_x2": 88.68721, "r_y2": 399.45938, "r_x3": 50.112019, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.646019, "r_y0": 408.13681, "r_x1": 170.0517, "r_y1": 408.13681, "r_x2": 170.0517, "r_y2": 399.54904, "r_x3": 91.646019, "r_y3": 399.54904, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05103, "r_y0": 408.36594, "r_x1": 286.36438, "r_y1": 408.36594, "r_x2": 286.36438, "r_y2": 399.45938, "r_x3": 170.05103, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 420.32092, "r_x1": 181.96703, "r_y1": 420.32092, "r_x2": 181.96703, "r_y2": 411.41437, "r_x3": 50.112022, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09029, "r_y0": 420.32092, "r_x1": 197.74918, "r_y1": 420.32092, "r_x2": 197.74918, "r_y2": 411.41437, "r_x3": 189.09029, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.34789, "r_y0": 420.32092, "r_x1": 286.36511, "r_y1": 420.32092, "r_x2": 286.36511, "r_y2": 411.41437, "r_x3": 200.34789, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 432.27591, "r_x1": 286.36511, "r_y1": 432.27591, "r_x2": 286.36511, "r_y2": 423.36934999999994, "r_x3": 50.112022, "r_y3": 423.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 444.2309, "r_x1": 158.2959, "r_y1": 444.2309, "r_x2": 158.2959, "r_y2": 435.32434, "r_x3": 50.112022, "r_y3": 435.32434, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$ ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$ . l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss ( l$_{iou}$ ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets." }, { "label": "text", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.112022, "t": 448.01035, "r": 286.36499, "b": 468.87189, "coord_origin": "TOPLEFT" }, "confidence": 0.9724196195602417, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067024, "r_y0": 456.9169, "r_x1": 286.36499, "r_y1": 456.9169, "r_x2": 286.36499, "r_y2": 448.01035, "r_x3": 62.067024, "r_y3": 448.01035, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 468.87189, "r_x1": 91.377113, "r_y1": 468.87189, "r_x2": 91.377113, "r_y2": 459.96533, "r_x3": 50.112022, "r_y3": 459.96533, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The loss used to train the TableFormer can be defined as following:" }, { "label": "formula", "id": 15, "page_no": 5, "cluster": { "id": 15, "label": "formula", "bbox": { "l": 124.33002, "t": 493.28094, "r": 286.36243, "b": 517.07172, "coord_origin": "TOPLEFT" }, "confidence": 0.9423348307609558, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.71502, "r_y0": 502.12772, "r_x1": 140.64182, "r_y1": 502.12772, "r_x2": 140.64182, "r_y2": 493.28094, "r_x3": 125.71502, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.90701, "r_y0": 502.12772, "r_x1": 151.65593, "r_y1": 502.12772, "r_x2": 151.65593, "r_y2": 493.28094, "r_x3": 143.90701, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42302, "r_y0": 502.12772, "r_x1": 186.62846, "r_y1": 502.12772, "r_x2": 186.62846, "r_y2": 493.28094, "r_x3": 154.42302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34003, "r_y0": 502.12772, "r_x1": 197.08894, "r_y1": 502.12772, "r_x2": 197.08894, "r_y2": 493.28094, "r_x3": 189.34003, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.30302, "r_y0": 502.12772, "r_x1": 211.64659, "r_y1": 502.12772, "r_x2": 211.64659, "r_y2": 493.28094, "r_x3": 199.30302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33002, "r_y0": 517.07172, "r_x1": 127.30286, "r_y1": 517.07172, "r_x2": 127.30286, "r_y2": 508.22495, "r_x3": 124.33002, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.26602, "r_y0": 517.07172, "r_x1": 138.01494, "r_y1": 517.07172, "r_x2": 138.01494, "r_y2": 508.22495, "r_x3": 130.26602, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78203, "r_y0": 517.07172, "r_x1": 153.32629, "r_y1": 517.07172, "r_x2": 153.32629, "r_y2": 508.22495, "r_x3": 140.78203, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.03903, "r_y0": 517.07172, "r_x1": 174.85541, "r_y1": 517.07172, "r_x2": 174.85541, "r_y2": 508.22495, "r_x3": 156.03903, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07103, "r_y0": 517.07172, "r_x1": 184.81995, "r_y1": 517.07172, "r_x2": 184.81995, "r_y2": 507.66702, "r_x3": 177.07103, "r_y3": 507.66702, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03304, "r_y0": 517.07172, "r_x1": 192.84422, "r_y1": 517.07172, "r_x2": 192.84422, "r_y2": 508.22495, "r_x3": 187.03304, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.84503, "r_y0": 517.07172, "r_x1": 196.71948, "r_y1": 517.07172, "r_x2": 196.71948, "r_y2": 508.22495, "r_x3": 192.84503, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.71902, "r_y0": 517.07172, "r_x1": 211.64583, "r_y1": 517.07172, "r_x2": 211.64583, "r_y2": 508.22495, "r_x3": 196.71902, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74603, "r_y0": 509.91788, "r_x1": 286.36243, "r_y1": 509.91788, "r_x2": 286.36243, "r_y2": 501.01132, "r_x3": 274.74603, "r_y3": 501.01132, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)" }, { "label": "text", "id": 16, "page_no": 5, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.11203, "t": 530.5920100000001, "r": 281.59692, "b": 540.21588, "coord_origin": "TOPLEFT" }, "confidence": 0.9363929629325867, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 540.21588, "r_x1": 74.450661, "r_y1": 540.21588, "r_x2": 74.450661, "r_y2": 531.30933, "r_x3": 50.11203, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.941032, "r_y0": 539.9967, "r_x1": 82.75222, "r_y1": 539.9967, "r_x2": 82.75222, "r_y2": 531.14993, "r_x3": 76.941032, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.520035, "r_y0": 539.9967, "r_x1": 92.162102, "r_y1": 539.9967, "r_x2": 92.162102, "r_y2": 530.5920100000001, "r_x3": 85.520035, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.653038, "r_y0": 540.21588, "r_x1": 135.59932, "r_y1": 540.21588, "r_x2": 135.59932, "r_y2": 531.30933, "r_x3": 94.653038, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09004, "r_y0": 539.9967, "r_x1": 172.63162, "r_y1": 539.9967, "r_x2": 172.63162, "r_y2": 531.14993, "r_x3": 138.09004, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.89705, "r_y0": 539.9967, "r_x1": 192.50104, "r_y1": 539.9967, "r_x2": 192.50104, "r_y2": 530.5920100000001, "r_x3": 175.89705, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99205, "r_y0": 540.21588, "r_x1": 281.59692, "r_y1": 540.21588, "r_x2": 281.59692, "r_y2": 531.30933, "r_x3": 194.99205, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters." }, { "label": "section_header", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.112045, "t": 555.91689, "r": 171.98335, "b": 566.66461, "coord_origin": "TOPLEFT" }, "confidence": 0.9554555416107178, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 566.66461, "r_x1": 57.92831799999999, "r_y1": 566.66461, "r_x2": 57.92831799999999, "r_y2": 555.91689, "r_x3": 50.112045, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.350014, "r_y0": 566.66461, "r_x1": 171.98335, "r_y1": 566.66461, "r_x2": 171.98335, "r_y2": 555.91689, "r_x3": 68.350014, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Experimental Results" }, { "label": "section_header", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.112045, "t": 576.26433, "r": 179.17502, "b": 586.1163799999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9538503289222717, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 586.1163799999999, "r_x1": 64.693237, "r_y1": 586.1163799999999, "r_x2": 64.693237, "r_y2": 576.26433, "r_x3": 50.112045, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.414032, "r_y0": 586.1163799999999, "r_x1": 179.17502, "r_y1": 586.1163799999999, "r_x2": 179.17502, "r_y2": 576.26433, "r_x3": 74.414032, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1. Implementation Details" }, { "label": "text", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.112045, "t": 595.73433, "r": 286.36517, "b": 640.50688, "coord_origin": "TOPLEFT" }, "confidence": 0.9856163263320923, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067047, "r_y0": 604.64088, "r_x1": 202.97806, "r_y1": 604.64088, "r_x2": 202.97806, "r_y2": 595.73433, "r_x3": 62.067047, "r_y3": 595.73433, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38405, "r_y0": 604.41174, "r_x1": 286.36008, "r_y1": 604.41174, "r_x2": 286.36008, "r_y2": 595.82399, "r_x3": 205.38405, "r_y3": 595.82399, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 616.3667399999999, "r_x1": 70.037247, "r_y1": 616.3667399999999, "r_x2": 70.037247, "r_y2": 607.77899, "r_x3": 50.112045, "r_y3": 607.77899, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037048, "r_y0": 616.59589, "r_x1": 286.36496, "r_y1": 616.59589, "r_x2": 286.36496, "r_y2": 607.68933, "r_x3": 70.037048, "r_y3": 607.68933, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 628.55089, "r_x1": 286.36517, "r_y1": 628.55089, "r_x2": 286.36517, "r_y2": 619.64433, "r_x3": 50.112049, "r_y3": 619.64433, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 640.50688, "r_x1": 207.03294, "r_y1": 640.50688, "r_x2": 207.03294, "r_y2": 631.60033, "r_x3": 50.112049, "r_y3": 631.60033, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:" }, { "label": "formula", "id": 18, "page_no": 5, "cluster": { "id": 18, "label": "formula", "bbox": { "l": 91.661049, "t": 653.828, "r": 286.36246, "b": 678.39588, "coord_origin": "TOPLEFT" }, "confidence": 0.844183623790741, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.661049, "r_y0": 663.45187, "r_x1": 186.01683, "r_y1": 663.45187, "r_x2": 186.01683, "r_y2": 654.54532, "r_x3": 91.661049, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.50705, "r_y0": 663.2327, "r_x1": 196.25597, "r_y1": 663.2327, "r_x2": 196.25597, "r_y2": 653.828, "r_x3": 188.50705, "r_y3": 653.828, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.74605, "r_y0": 663.45187, "r_x1": 244.81310999999997, "r_y1": 663.45187, "r_x2": 244.81310999999997, "r_y2": 654.54532, "r_x3": 198.74605, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.01604, "r_y0": 678.39588, "r_x1": 186.24606, "r_y1": 678.39588, "r_x2": 186.24606, "r_y2": 669.48932, "r_x3": 101.01604, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.73605, "r_y0": 678.1767, "r_x1": 196.48497, "r_y1": 678.1767, "r_x2": 196.48497, "r_y2": 668.77201, "r_x3": 188.73605, "r_y3": 668.77201, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.97505, "r_y0": 678.39588, "r_x1": 244.81296999999998, "r_y1": 678.39588, "r_x2": 244.81296999999998, "r_y2": 669.48932, "r_x3": 198.97505, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74606, "r_y0": 671.02388, "r_x1": 286.36246, "r_y1": 671.02388, "r_x2": 286.36246, "r_y2": 662.11731, "r_x3": 274.74606, "r_y3": 662.11731, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)" }, { "label": "text", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.112061, "t": 692.290314, "r": 286.36514, "b": 713.151878, "coord_origin": "TOPLEFT" }, "confidence": 0.9724979996681213, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 701.196877, "r_x1": 286.36514, "r_y1": 701.196877, "r_x2": 286.36514, "r_y2": 692.290314, "r_x3": 50.112061, "r_y3": 692.290314, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 713.151878, "r_x1": 286.36514, "r_y1": 713.151878, "r_x2": 286.36514, "r_y2": 704.245316, "r_x3": 50.112061, "r_y3": 704.245316, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved" }, { "label": "text", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.86206, "t": 75.20830999999998, "r": 545.11523, "b": 108.0249, "coord_origin": "TOPLEFT" }, "confidence": 0.9799237847328186, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 84.11487, "r_x1": 545.11523, "r_y1": 84.11487, "r_x2": 545.11523, "r_y2": 75.20830999999998, "r_x3": 308.86206, "r_y3": 75.20830999999998, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 96.06988999999999, "r_x1": 339.98523, "r_y1": 96.06988999999999, "r_x2": 339.98523, "r_y2": 87.16332999999997, "r_x3": 308.86206, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.88931, "r_y0": 96.06988999999999, "r_x1": 545.11523, "r_y1": 96.06988999999999, "r_x2": 545.11523, "r_y2": 87.16332999999997, "r_x3": 346.88931, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 108.0249, "r_x1": 492.96097, "r_y1": 108.0249, "r_x2": 492.96097, "r_y2": 99.11835000000008, "r_x3": 308.86206, "r_y3": 99.11835000000008, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86206, "t": 116.22937000000002, "r": 545.1153, "b": 328.37405, "coord_origin": "TOPLEFT" }, "confidence": 0.9880930781364441, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 125.13593000000003, "r_x1": 545.11499, "r_y1": 125.13593000000003, "r_x2": 545.11499, "r_y2": 116.22937000000002, "r_x3": 320.81705, "r_y3": 116.22937000000002, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 137.09094000000005, "r_x1": 545.11517, "r_y1": 137.09094000000005, "r_x2": 545.11517, "r_y2": 128.18439, "r_x3": 308.86206, "r_y3": 128.18439, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 149.04596000000004, "r_x1": 545.11505, "r_y1": 149.04596000000004, "r_x2": 545.11505, "r_y2": 140.13940000000002, "r_x3": 308.86206, "r_y3": 140.13940000000002, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 161.00098000000003, "r_x1": 545.11511, "r_y1": 161.00098000000003, "r_x2": 545.11511, "r_y2": 152.09442, "r_x3": 308.86206, "r_y3": 152.09442, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 172.95599000000004, "r_x1": 545.11517, "r_y1": 172.95599000000004, "r_x2": 545.11517, "r_y2": 164.04944, "r_x3": 308.86206, "r_y3": 164.04944, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 184.91198999999995, "r_x1": 467.21756000000005, "r_y1": 184.91198999999995, "r_x2": 467.21756000000005, "r_y2": 176.00543000000005, "r_x3": 308.86206, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.43671, "r_y0": 184.91198999999995, "r_x1": 545.11511, "r_y1": 184.91198999999995, "r_x2": 545.11511, "r_y2": 176.00543000000005, "r_x3": 475.43671, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 196.86699999999996, "r_x1": 545.11511, "r_y1": 196.86699999999996, "r_x2": 545.11511, "r_y2": 187.96045000000004, "r_x3": 308.86206, "r_y3": 187.96045000000004, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 208.82201999999995, "r_x1": 545.11511, "r_y1": 208.82201999999995, "r_x2": 545.11511, "r_y2": 199.91547000000003, "r_x3": 308.86206, "r_y3": 199.91547000000003, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 220.77704000000006, "r_x1": 545.11517, "r_y1": 220.77704000000006, "r_x2": 545.11517, "r_y2": 211.87048000000004, "r_x3": 308.86206, "r_y3": 211.87048000000004, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 232.73206000000005, "r_x1": 545.11511, "r_y1": 232.73206000000005, "r_x2": 545.11511, "r_y2": 223.82550000000003, "r_x3": 308.86206, "r_y3": 223.82550000000003, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 244.68706999999995, "r_x1": 545.11511, "r_y1": 244.68706999999995, "r_x2": 545.11511, "r_y2": 235.78052000000002, "r_x3": 308.86206, "r_y3": 235.78052000000002, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 256.64306999999997, "r_x1": 545.11523, "r_y1": 256.64306999999997, "r_x2": 545.11523, "r_y2": 247.73650999999995, "r_x3": 308.86206, "r_y3": 247.73650999999995, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 268.59808, "r_x1": 342.3364, "r_y1": 268.59808, "r_x2": 342.3364, "r_y2": 259.69152999999994, "r_x3": 308.86206, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95157, "r_y0": 268.59808, "r_x1": 545.11517, "r_y1": 268.59808, "r_x2": 545.11517, "r_y2": 259.69152999999994, "r_x3": 348.95157, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 280.55310000000003, "r_x1": 545.11517, "r_y1": 280.55310000000003, "r_x2": 545.11517, "r_y2": 271.64655000000005, "r_x3": 308.86206, "r_y3": 271.64655000000005, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 292.50809, "r_x1": 545.1153, "r_y1": 292.50809, "r_x2": 545.1153, "r_y2": 283.6015300000001, "r_x3": 308.86206, "r_y3": 283.6015300000001, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 304.46307, "r_x1": 545.11511, "r_y1": 304.46307, "r_x2": 545.11511, "r_y2": 295.55652, "r_x3": 308.86206, "r_y3": 295.55652, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 316.41806, "r_x1": 545.11511, "r_y1": 316.41806, "r_x2": 545.11511, "r_y2": 307.51151, "r_x3": 308.86206, "r_y3": 307.51151, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 328.37405, "r_x1": 532.48267, "r_y1": 328.37405, "r_x2": 532.48267, "r_y2": 319.4674999999999, "r_x3": 308.86206, "r_y3": 319.4674999999999, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5." }, { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86203, "t": 336.57751, "r": 545.11517, "b": 429.16998, "coord_origin": "TOPLEFT" }, "confidence": 0.9877589344978333, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 345.48407000000003, "r_x1": 545.11499, "r_y1": 345.48407000000003, "r_x2": 545.11499, "r_y2": 336.57751, "r_x3": 320.81705, "r_y3": 336.57751, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 357.43906, "r_x1": 403.7359, "r_y1": 357.43906, "r_x2": 403.7359, "r_y2": 348.5325000000001, "r_x3": 308.86206, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.07605, "r_y0": 357.20993, "r_x1": 503.54016, "r_y1": 357.20993, "r_x2": 503.54016, "r_y2": 348.62216, "r_x3": 406.07605, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.53906, "r_y0": 357.43906, "r_x1": 506.02972, "r_y1": 357.43906, "r_x2": 506.02972, "r_y2": 348.5325000000001, "r_x3": 503.53906, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.40004999999996, "r_y0": 357.20993, "r_x1": 545.11224, "r_y1": 357.20993, "r_x2": 545.11224, "r_y2": 348.62216, "r_x3": 508.40004999999996, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 369.16492000000005, "r_x1": 343.1633, "r_y1": 369.16492000000005, "r_x2": 343.1633, "r_y2": 360.57715, "r_x3": 308.86206, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16306, "r_y0": 369.39404, "r_x1": 362.2016, "r_y1": 369.39404, "r_x2": 362.2016, "r_y2": 360.48749, "r_x3": 343.16306, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.28604, "r_y0": 369.16492000000005, "r_x1": 440.93829, "r_y1": 369.16492000000005, "r_x2": 440.93829, "r_y2": 360.57715, "r_x3": 364.28604, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.93903, "r_y0": 369.39404, "r_x1": 545.10797, "r_y1": 369.39404, "r_x2": 545.10797, "r_y2": 360.48749, "r_x3": 440.93903, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 381.34903, "r_x1": 545.11511, "r_y1": 381.34903, "r_x2": 545.11511, "r_y2": 372.44247, "r_x3": 308.86203, "r_y3": 372.44247, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 393.30502, "r_x1": 545.11517, "r_y1": 393.30502, "r_x2": 545.11517, "r_y2": 384.3984699999999, "r_x3": 308.86203, "r_y3": 384.3984699999999, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 405.04083, "r_x1": 314.67322, "r_y1": 405.04083, "r_x2": 314.67322, "r_y2": 396.19406000000004, "r_x3": 308.86203, "r_y3": 396.19406000000004, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.65802, "r_y0": 405.2600100000001, "r_x1": 360.39139, "r_y1": 405.2600100000001, "r_x2": 360.39139, "r_y2": 396.35345, "r_x3": 318.65802, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96295, "r_y0": 405.2600100000001, "r_x1": 545.10803, "r_y1": 405.2600100000001, "r_x2": 545.10803, "r_y2": 396.35345, "r_x3": 367.96295, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 417.215, "r_x1": 545.11511, "r_y1": 417.215, "r_x2": 545.11511, "r_y2": 408.30844, "r_x3": 308.86203, "r_y3": 408.30844, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 429.16998, "r_x1": 360.9664, "r_y1": 429.16998, "r_x2": 360.9664, "r_y2": 420.26343, "r_x3": 308.86203, "r_y3": 420.26343, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence." }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86203, "t": 437.37441999999993, "r": 545.11523, "b": 553.87689, "coord_origin": "TOPLEFT" }, "confidence": 0.9884491562843323, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 446.28098, "r_x1": 545.11499, "r_y1": 446.28098, "r_x2": 545.11499, "r_y2": 437.37441999999993, "r_x3": 320.81702, "r_y3": 437.37441999999993, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 458.23596, "r_x1": 384.62759, "r_y1": 458.23596, "r_x2": 384.62759, "r_y2": 449.32941, "r_x3": 308.86203, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37228, "r_y0": 458.23596, "r_x1": 545.11511, "r_y1": 458.23596, "r_x2": 545.11511, "r_y2": 449.32941, "r_x3": 391.37228, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 470.19095, "r_x1": 494.00693000000007, "r_y1": 470.19095, "r_x2": 494.00693000000007, "r_y2": 461.28439, "r_x3": 308.86203, "r_y3": 461.28439, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.07803, "r_y0": 469.96182, "r_x1": 545.11145, "r_y1": 469.96182, "r_x2": 545.11145, "r_y2": 461.37405, "r_x3": 498.07803, "r_y3": 461.37405, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 481.91681, "r_x1": 364.44336, "r_y1": 481.91681, "r_x2": 364.44336, "r_y2": 473.32904, "r_x3": 308.86203, "r_y3": 473.32904, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06104, "r_y0": 482.14594, "r_x1": 545.11267, "r_y1": 482.14594, "r_x2": 545.11267, "r_y2": 473.23938, "r_x3": 367.06104, "r_y3": 473.23938, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 494.10092, "r_x1": 545.11511, "r_y1": 494.10092, "r_x2": 545.11511, "r_y2": 485.19437, "r_x3": 308.86203, "r_y3": 485.19437, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 506.05591, "r_x1": 545.11523, "r_y1": 506.05591, "r_x2": 545.11523, "r_y2": 497.14935, "r_x3": 308.86203, "r_y3": 497.14935, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 518.0119, "r_x1": 545.11511, "r_y1": 518.0119, "r_x2": 545.11511, "r_y2": 509.10535, "r_x3": 308.86203, "r_y3": 509.10535, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 529.9668899999999, "r_x1": 545.11517, "r_y1": 529.9668899999999, "r_x2": 545.11517, "r_y2": 521.06033, "r_x3": 308.86203, "r_y3": 521.06033, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 541.9218900000001, "r_x1": 545.11517, "r_y1": 541.9218900000001, "r_x2": 545.11517, "r_y2": 533.01532, "r_x3": 308.86203, "r_y3": 533.01532, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 553.87689, "r_x1": 377.21548, "r_y1": 553.87689, "r_x2": 377.21548, "r_y2": 544.97034, "r_x3": 308.86203, "r_y3": 544.97034, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag." }, { "label": "section_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 308.86203, "t": 579.55432, "r": 397.44281, "b": 589.40637, "coord_origin": "TOPLEFT" }, "confidence": 0.9450808763504028, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 589.40637, "r_x1": 323.9046, "r_y1": 589.40637, "r_x2": 323.9046, "r_y2": 579.55432, "r_x3": 308.86203, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93301, "r_y0": 589.40637, "r_x1": 397.44281, "r_y1": 589.40637, "r_x2": 397.44281, "r_y2": 579.55432, "r_x3": 333.93301, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2. Generalization" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86203, "t": 603.44933, "r": 545.11517, "b": 672.13189, "coord_origin": "TOPLEFT" }, "confidence": 0.9880595803260803, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 612.3558800000001, "r_x1": 545.11493, "r_y1": 612.3558800000001, "r_x2": 545.11493, "r_y2": 603.44933, "r_x3": 320.81702, "r_y3": 603.44933, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 624.31088, "r_x1": 545.11511, "r_y1": 624.31088, "r_x2": 545.11511, "r_y2": 615.40433, "r_x3": 308.86203, "r_y3": 615.40433, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 636.26588, "r_x1": 545.11517, "r_y1": 636.26588, "r_x2": 545.11517, "r_y2": 627.35933, "r_x3": 308.86203, "r_y3": 627.35933, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 648.22089, "r_x1": 545.11511, "r_y1": 648.22089, "r_x2": 545.11511, "r_y2": 639.31433, "r_x3": 308.86203, "r_y3": 639.31433, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 660.17688, "r_x1": 545.11517, "r_y1": 660.17688, "r_x2": 545.11517, "r_y2": 651.27032, "r_x3": 308.86203, "r_y3": 651.27032, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 672.13189, "r_x1": 350.70493, "r_y1": 672.13189, "r_x2": 350.70493, "r_y2": 663.22533, "r_x3": 308.86203, "r_y3": 663.22533, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively." }, { "label": "text", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.86203, "t": 680.33533, "r": 545.11523, "b": 713.152893, "coord_origin": "TOPLEFT" }, "confidence": 0.9830910563468933, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 689.24189, "r_x1": 545.11505, "r_y1": 689.24189, "r_x2": 545.11505, "r_y2": 680.33533, "r_x3": 320.81702, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 701.196892, "r_x1": 396.21411, "r_y1": 701.196892, "r_x2": 396.21411, "r_y2": 692.290329, "r_x3": 308.86203, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.40585, "r_y0": 701.196892, "r_x1": 545.11523, "r_y1": 701.196892, "r_x2": 545.11523, "r_y2": 692.290329, "r_x3": 406.40585, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 713.152893, "r_x1": 495.93982, "r_y1": 713.152893, "r_x2": 495.93982, "r_y2": 704.246323, "r_x3": 308.86203, "r_y3": 704.246323, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized." }, { "label": "page_footer", "id": 17, "page_no": 5, "cluster": { "id": 17, "label": "page_footer", "bbox": { "l": 295.12103, "t": 734.133327, "r": 300.10233, "b": 743.03989, "coord_origin": "TOPLEFT" }, "confidence": 0.8820409178733826, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.03989, "r_x1": 300.10233, "r_y1": 743.03989, "r_x2": 300.10233, "r_y2": 734.133327, "r_x3": 295.12103, "r_y3": 734.133327, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" } ], "body": [ { "label": "text", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 286.36514, "b": 155.84600999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9868090152740479, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 286.36514, "r_y1": 84.11492999999996, "r_x2": 286.36514, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 96.06994999999995, "r_x1": 286.36508, "r_y1": 96.06994999999995, "r_x2": 286.36508, "r_y2": 87.16339000000005, "r_x3": 50.112, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 286.36508, "r_y1": 108.02495999999985, "r_x2": 286.36508, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 119.97997999999984, "r_x1": 286.36508, "r_y1": 119.97997999999984, "r_x2": 286.36508, "r_y2": 111.07343000000003, "r_x3": 50.112, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.93499999999995, "r_x1": 286.36508, "r_y1": 131.93499999999995, "r_x2": 286.36508, "r_y2": 123.02844000000005, "r_x3": 50.112, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 143.89099, "r_x1": 286.36514, "r_y1": 143.89099, "r_x2": 286.36514, "r_y2": 134.98443999999995, "r_x3": 50.112, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 155.84600999999998, "r_x1": 175.16254, "r_y1": 155.84600999999998, "r_x2": 175.16254, "r_y2": 146.93944999999997, "r_x3": 50.112, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.112, "t": 159.62445000000002, "r": 286.36511, "b": 240.26306, "coord_origin": "TOPLEFT" }, "confidence": 0.9860327839851379, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 168.53101000000004, "r_x1": 286.36496, "r_y1": 168.53101000000004, "r_x2": 286.36496, "r_y2": 159.62445000000002, "r_x3": 62.067001, "r_y3": 159.62445000000002, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 180.48699999999997, "r_x1": 286.36511, "r_y1": 180.48699999999997, "r_x2": 286.36511, "r_y2": 171.58043999999995, "r_x3": 50.112, "r_y3": 171.58043999999995, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 192.44201999999996, "r_x1": 286.36511, "r_y1": 192.44201999999996, "r_x2": 286.36511, "r_y2": 183.53545999999994, "r_x3": 50.112, "r_y3": 183.53545999999994, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 204.39702999999997, "r_x1": 286.36511, "r_y1": 204.39702999999997, "r_x2": 286.36511, "r_y2": 195.49048000000005, "r_x3": 50.112, "r_y3": 195.49048000000005, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 216.35204999999996, "r_x1": 286.36511, "r_y1": 216.35204999999996, "r_x2": 286.36511, "r_y2": 207.44550000000004, "r_x3": 50.112, "r_y3": 207.44550000000004, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 228.30706999999995, "r_x1": 286.36511, "r_y1": 228.30706999999995, "r_x2": 286.36511, "r_y2": 219.40051000000005, "r_x3": 50.112, "r_y3": 219.40051000000005, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 240.26306, "r_x1": 181.54855, "r_y1": 240.26306, "r_x2": 181.54855, "r_y2": 231.35650999999996, "r_x3": 50.112, "r_y3": 231.35650999999996, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer." }, { "label": "text", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.112, "t": 243.92193999999995, "r": 286.36572, "b": 444.2309, "coord_origin": "TOPLEFT" }, "confidence": 0.9873637557029724, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.87829999999997, "r_x1": 129.21492, "r_y1": 252.87829999999997, "r_x2": 129.21492, "r_y2": 243.92193999999995, "r_x3": 62.067001, "r_y3": 243.92193999999995, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.451, "r_y0": 252.94806000000005, "r_x1": 286.36078, "r_y1": 252.94806000000005, "r_x2": 286.36078, "r_y2": 244.04150000000004, "r_x3": 134.451, "r_y3": 244.04150000000004, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 264.90308000000005, "r_x1": 286.36511, "r_y1": 264.90308000000005, "r_x2": 286.36511, "r_y2": 255.99652000000003, "r_x3": 50.112007, "r_y3": 255.99652000000003, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 276.63989000000004, "r_x1": 56.84528, "r_y1": 276.63989000000004, "r_x2": 56.84528, "r_y2": 267.79309, "r_x3": 50.112007, "r_y3": 267.79309, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.343006, "r_y0": 276.85907, "r_x1": 135.39996, "r_y1": 276.85907, "r_x2": 135.39996, "r_y2": 267.95250999999996, "r_x3": 57.343006, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.735, "r_y0": 276.62994000000003, "r_x1": 211.07965, "r_y1": 276.62994000000003, "r_x2": 211.07965, "r_y2": 268.04218000000003, "r_x3": 137.735, "r_y3": 268.04218000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.63699, "r_y0": 276.85907, "r_x1": 286.36395, "r_y1": 276.85907, "r_x2": 286.36395, "r_y2": 267.95250999999996, "r_x3": 213.63699, "r_y3": 267.95250999999996, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.81406, "r_x1": 158.82388, "r_y1": 288.81406, "r_x2": 158.82388, "r_y2": 279.90747, "r_x3": 50.112, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.31799, "r_y0": 288.58493, "r_x1": 238.79712, "r_y1": 288.58493, "r_x2": 238.79712, "r_y2": 279.99712999999997, "r_x3": 161.31799, "r_y3": 279.99712999999997, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.521, "r_y0": 288.81406, "r_x1": 286.36264, "r_y1": 288.81406, "r_x2": 286.36264, "r_y2": 279.90747, "r_x3": 241.521, "r_y3": 279.90747, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.76904, "r_x1": 211.3766, "r_y1": 300.76904, "r_x2": 211.3766, "r_y2": 291.86249, "r_x3": 50.112, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.271, "r_y0": 300.54987, "r_x1": 229.19780000000003, "r_y1": 300.54987, "r_x2": 229.19780000000003, "r_y2": 291.70309, "r_x3": 214.271, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.696, "r_y0": 300.76904, "r_x1": 232.18665000000001, "r_y1": 300.76904, "r_x2": 232.18665000000001, "r_y2": 291.86249, "r_x3": 229.696, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49001, "r_y0": 300.54987, "r_x1": 251.41681000000003, "r_y1": 300.54987, "r_x2": 251.41681000000003, "r_y2": 291.70309, "r_x3": 236.49001, "r_y3": 291.70309, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81099999999998, "r_y0": 300.76904, "r_x1": 286.36255, "r_y1": 300.76904, "r_x2": 286.36255, "r_y2": 291.86249, "r_x3": 254.81099999999998, "r_y3": 291.86249, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.72403, "r_x1": 137.45412, "r_y1": 312.72403, "r_x2": 137.45412, "r_y2": 303.81747, "r_x3": 50.112, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.298, "r_y0": 312.50485, "r_x1": 148.24258, "r_y1": 312.50485, "r_x2": 148.24258, "r_y2": 303.65808, "r_x3": 141.298, "r_y3": 303.65808, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.58601, "r_y0": 312.72403, "r_x1": 286.36377, "r_y1": 312.72403, "r_x2": 286.36377, "r_y2": 303.81747, "r_x3": 152.58601, "r_y3": 303.81747, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 324.67902, "r_x1": 89.683464, "r_y1": 324.67902, "r_x2": 89.683464, "r_y2": 315.77245999999997, "r_x3": 50.112015, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.68602, "r_y0": 324.45984, "r_x1": 104.12046, "r_y1": 324.45984, "r_x2": 104.12046, "r_y2": 315.61307, "r_x3": 89.68602, "r_y3": 315.61307, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.61802, "r_y0": 324.67902, "r_x1": 286.36572, "r_y1": 324.67902, "r_x2": 286.36572, "r_y2": 315.77245999999997, "r_x3": 104.61802, "r_y3": 315.77245999999997, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 336.6350100000001, "r_x1": 286.36511, "r_y1": 336.6350100000001, "r_x2": 286.36511, "r_y2": 327.72845, "r_x3": 50.112019, "r_y3": 327.72845, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 348.59, "r_x1": 286.36508, "r_y1": 348.59, "r_x2": 286.36508, "r_y2": 339.68344, "r_x3": 50.112019, "r_y3": 339.68344, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 360.54498, "r_x1": 286.36511, "r_y1": 360.54498, "r_x2": 286.36511, "r_y2": 351.63843, "r_x3": 50.112019, "r_y3": 351.63843, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 372.49996999999996, "r_x1": 286.36508, "r_y1": 372.49996999999996, "r_x2": 286.36508, "r_y2": 363.59341, "r_x3": 50.112019, "r_y3": 363.59341, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 384.45496, "r_x1": 286.36511, "r_y1": 384.45496, "r_x2": 286.36511, "r_y2": 375.5484, "r_x3": 50.112019, "r_y3": 375.5484, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 396.40994, "r_x1": 286.36514, "r_y1": 396.40994, "r_x2": 286.36514, "r_y2": 387.50339, "r_x3": 50.112019, "r_y3": 387.50339, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112019, "r_y0": 408.36594, "r_x1": 88.68721, "r_y1": 408.36594, "r_x2": 88.68721, "r_y2": 399.45938, "r_x3": 50.112019, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.646019, "r_y0": 408.13681, "r_x1": 170.0517, "r_y1": 408.13681, "r_x2": 170.0517, "r_y2": 399.54904, "r_x3": 91.646019, "r_y3": 399.54904, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05103, "r_y0": 408.36594, "r_x1": 286.36438, "r_y1": 408.36594, "r_x2": 286.36438, "r_y2": 399.45938, "r_x3": 170.05103, "r_y3": 399.45938, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 420.32092, "r_x1": 181.96703, "r_y1": 420.32092, "r_x2": 181.96703, "r_y2": 411.41437, "r_x3": 50.112022, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09029, "r_y0": 420.32092, "r_x1": 197.74918, "r_y1": 420.32092, "r_x2": 197.74918, "r_y2": 411.41437, "r_x3": 189.09029, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.34789, "r_y0": 420.32092, "r_x1": 286.36511, "r_y1": 420.32092, "r_x2": 286.36511, "r_y2": 411.41437, "r_x3": 200.34789, "r_y3": 411.41437, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 432.27591, "r_x1": 286.36511, "r_y1": 432.27591, "r_x2": 286.36511, "r_y2": 423.36934999999994, "r_x3": 50.112022, "r_y3": 423.36934999999994, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 444.2309, "r_x1": 158.2959, "r_y1": 444.2309, "r_x2": 158.2959, "r_y2": 435.32434, "r_x3": 50.112022, "r_y3": 435.32434, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$ ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$ . l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss ( l$_{iou}$ ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets." }, { "label": "text", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.112022, "t": 448.01035, "r": 286.36499, "b": 468.87189, "coord_origin": "TOPLEFT" }, "confidence": 0.9724196195602417, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067024, "r_y0": 456.9169, "r_x1": 286.36499, "r_y1": 456.9169, "r_x2": 286.36499, "r_y2": 448.01035, "r_x3": 62.067024, "r_y3": 448.01035, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 468.87189, "r_x1": 91.377113, "r_y1": 468.87189, "r_x2": 91.377113, "r_y2": 459.96533, "r_x3": 50.112022, "r_y3": 459.96533, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The loss used to train the TableFormer can be defined as following:" }, { "label": "formula", "id": 15, "page_no": 5, "cluster": { "id": 15, "label": "formula", "bbox": { "l": 124.33002, "t": 493.28094, "r": 286.36243, "b": 517.07172, "coord_origin": "TOPLEFT" }, "confidence": 0.9423348307609558, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.71502, "r_y0": 502.12772, "r_x1": 140.64182, "r_y1": 502.12772, "r_x2": 140.64182, "r_y2": 493.28094, "r_x3": 125.71502, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.90701, "r_y0": 502.12772, "r_x1": 151.65593, "r_y1": 502.12772, "r_x2": 151.65593, "r_y2": 493.28094, "r_x3": 143.90701, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42302, "r_y0": 502.12772, "r_x1": 186.62846, "r_y1": 502.12772, "r_x2": 186.62846, "r_y2": 493.28094, "r_x3": 154.42302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34003, "r_y0": 502.12772, "r_x1": 197.08894, "r_y1": 502.12772, "r_x2": 197.08894, "r_y2": 493.28094, "r_x3": 189.34003, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.30302, "r_y0": 502.12772, "r_x1": 211.64659, "r_y1": 502.12772, "r_x2": 211.64659, "r_y2": 493.28094, "r_x3": 199.30302, "r_y3": 493.28094, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33002, "r_y0": 517.07172, "r_x1": 127.30286, "r_y1": 517.07172, "r_x2": 127.30286, "r_y2": 508.22495, "r_x3": 124.33002, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.26602, "r_y0": 517.07172, "r_x1": 138.01494, "r_y1": 517.07172, "r_x2": 138.01494, "r_y2": 508.22495, "r_x3": 130.26602, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78203, "r_y0": 517.07172, "r_x1": 153.32629, "r_y1": 517.07172, "r_x2": 153.32629, "r_y2": 508.22495, "r_x3": 140.78203, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.03903, "r_y0": 517.07172, "r_x1": 174.85541, "r_y1": 517.07172, "r_x2": 174.85541, "r_y2": 508.22495, "r_x3": 156.03903, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07103, "r_y0": 517.07172, "r_x1": 184.81995, "r_y1": 517.07172, "r_x2": 184.81995, "r_y2": 507.66702, "r_x3": 177.07103, "r_y3": 507.66702, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03304, "r_y0": 517.07172, "r_x1": 192.84422, "r_y1": 517.07172, "r_x2": 192.84422, "r_y2": 508.22495, "r_x3": 187.03304, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.84503, "r_y0": 517.07172, "r_x1": 196.71948, "r_y1": 517.07172, "r_x2": 196.71948, "r_y2": 508.22495, "r_x3": 192.84503, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.71902, "r_y0": 517.07172, "r_x1": 211.64583, "r_y1": 517.07172, "r_x2": 211.64583, "r_y2": 508.22495, "r_x3": 196.71902, "r_y3": 508.22495, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74603, "r_y0": 509.91788, "r_x1": 286.36243, "r_y1": 509.91788, "r_x2": 286.36243, "r_y2": 501.01132, "r_x3": 274.74603, "r_y3": 501.01132, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)" }, { "label": "text", "id": 16, "page_no": 5, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.11203, "t": 530.5920100000001, "r": 281.59692, "b": 540.21588, "coord_origin": "TOPLEFT" }, "confidence": 0.9363929629325867, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 540.21588, "r_x1": 74.450661, "r_y1": 540.21588, "r_x2": 74.450661, "r_y2": 531.30933, "r_x3": 50.11203, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.941032, "r_y0": 539.9967, "r_x1": 82.75222, "r_y1": 539.9967, "r_x2": 82.75222, "r_y2": 531.14993, "r_x3": 76.941032, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.520035, "r_y0": 539.9967, "r_x1": 92.162102, "r_y1": 539.9967, "r_x2": 92.162102, "r_y2": 530.5920100000001, "r_x3": 85.520035, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.653038, "r_y0": 540.21588, "r_x1": 135.59932, "r_y1": 540.21588, "r_x2": 135.59932, "r_y2": 531.30933, "r_x3": 94.653038, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09004, "r_y0": 539.9967, "r_x1": 172.63162, "r_y1": 539.9967, "r_x2": 172.63162, "r_y2": 531.14993, "r_x3": 138.09004, "r_y3": 531.14993, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.89705, "r_y0": 539.9967, "r_x1": 192.50104, "r_y1": 539.9967, "r_x2": 192.50104, "r_y2": 530.5920100000001, "r_x3": 175.89705, "r_y3": 530.5920100000001, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99205, "r_y0": 540.21588, "r_x1": 281.59692, "r_y1": 540.21588, "r_x2": 281.59692, "r_y2": 531.30933, "r_x3": 194.99205, "r_y3": 531.30933, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters." }, { "label": "section_header", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.112045, "t": 555.91689, "r": 171.98335, "b": 566.66461, "coord_origin": "TOPLEFT" }, "confidence": 0.9554555416107178, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 566.66461, "r_x1": 57.92831799999999, "r_y1": 566.66461, "r_x2": 57.92831799999999, "r_y2": 555.91689, "r_x3": 50.112045, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.350014, "r_y0": 566.66461, "r_x1": 171.98335, "r_y1": 566.66461, "r_x2": 171.98335, "r_y2": 555.91689, "r_x3": 68.350014, "r_y3": 555.91689, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Experimental Results" }, { "label": "section_header", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.112045, "t": 576.26433, "r": 179.17502, "b": 586.1163799999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9538503289222717, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 586.1163799999999, "r_x1": 64.693237, "r_y1": 586.1163799999999, "r_x2": 64.693237, "r_y2": 576.26433, "r_x3": 50.112045, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.414032, "r_y0": 586.1163799999999, "r_x1": 179.17502, "r_y1": 586.1163799999999, "r_x2": 179.17502, "r_y2": 576.26433, "r_x3": 74.414032, "r_y3": 576.26433, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1. Implementation Details" }, { "label": "text", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.112045, "t": 595.73433, "r": 286.36517, "b": 640.50688, "coord_origin": "TOPLEFT" }, "confidence": 0.9856163263320923, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067047, "r_y0": 604.64088, "r_x1": 202.97806, "r_y1": 604.64088, "r_x2": 202.97806, "r_y2": 595.73433, "r_x3": 62.067047, "r_y3": 595.73433, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38405, "r_y0": 604.41174, "r_x1": 286.36008, "r_y1": 604.41174, "r_x2": 286.36008, "r_y2": 595.82399, "r_x3": 205.38405, "r_y3": 595.82399, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112045, "r_y0": 616.3667399999999, "r_x1": 70.037247, "r_y1": 616.3667399999999, "r_x2": 70.037247, "r_y2": 607.77899, "r_x3": 50.112045, "r_y3": 607.77899, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037048, "r_y0": 616.59589, "r_x1": 286.36496, "r_y1": 616.59589, "r_x2": 286.36496, "r_y2": 607.68933, "r_x3": 70.037048, "r_y3": 607.68933, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 628.55089, "r_x1": 286.36517, "r_y1": 628.55089, "r_x2": 286.36517, "r_y2": 619.64433, "r_x3": 50.112049, "r_y3": 619.64433, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112049, "r_y0": 640.50688, "r_x1": 207.03294, "r_y1": 640.50688, "r_x2": 207.03294, "r_y2": 631.60033, "r_x3": 50.112049, "r_y3": 631.60033, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:" }, { "label": "formula", "id": 18, "page_no": 5, "cluster": { "id": 18, "label": "formula", "bbox": { "l": 91.661049, "t": 653.828, "r": 286.36246, "b": 678.39588, "coord_origin": "TOPLEFT" }, "confidence": 0.844183623790741, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.661049, "r_y0": 663.45187, "r_x1": 186.01683, "r_y1": 663.45187, "r_x2": 186.01683, "r_y2": 654.54532, "r_x3": 91.661049, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.50705, "r_y0": 663.2327, "r_x1": 196.25597, "r_y1": 663.2327, "r_x2": 196.25597, "r_y2": 653.828, "r_x3": 188.50705, "r_y3": 653.828, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.74605, "r_y0": 663.45187, "r_x1": 244.81310999999997, "r_y1": 663.45187, "r_x2": 244.81310999999997, "r_y2": 654.54532, "r_x3": 198.74605, "r_y3": 654.54532, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.01604, "r_y0": 678.39588, "r_x1": 186.24606, "r_y1": 678.39588, "r_x2": 186.24606, "r_y2": 669.48932, "r_x3": 101.01604, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.73605, "r_y0": 678.1767, "r_x1": 196.48497, "r_y1": 678.1767, "r_x2": 196.48497, "r_y2": 668.77201, "r_x3": 188.73605, "r_y3": 668.77201, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.97505, "r_y0": 678.39588, "r_x1": 244.81296999999998, "r_y1": 678.39588, "r_x2": 244.81296999999998, "r_y2": 669.48932, "r_x3": 198.97505, "r_y3": 669.48932, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.74606, "r_y0": 671.02388, "r_x1": 286.36246, "r_y1": 671.02388, "r_x2": 286.36246, "r_y2": 662.11731, "r_x3": 274.74606, "r_y3": 662.11731, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)" }, { "label": "text", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.112061, "t": 692.290314, "r": 286.36514, "b": 713.151878, "coord_origin": "TOPLEFT" }, "confidence": 0.9724979996681213, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 701.196877, "r_x1": 286.36514, "r_y1": 701.196877, "r_x2": 286.36514, "r_y2": 692.290314, "r_x3": 50.112061, "r_y3": 692.290314, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112061, "r_y0": 713.151878, "r_x1": 286.36514, "r_y1": 713.151878, "r_x2": 286.36514, "r_y2": 704.245316, "r_x3": 50.112061, "r_y3": 704.245316, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved" }, { "label": "text", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.86206, "t": 75.20830999999998, "r": 545.11523, "b": 108.0249, "coord_origin": "TOPLEFT" }, "confidence": 0.9799237847328186, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 84.11487, "r_x1": 545.11523, "r_y1": 84.11487, "r_x2": 545.11523, "r_y2": 75.20830999999998, "r_x3": 308.86206, "r_y3": 75.20830999999998, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 96.06988999999999, "r_x1": 339.98523, "r_y1": 96.06988999999999, "r_x2": 339.98523, "r_y2": 87.16332999999997, "r_x3": 308.86206, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.88931, "r_y0": 96.06988999999999, "r_x1": 545.11523, "r_y1": 96.06988999999999, "r_x2": 545.11523, "r_y2": 87.16332999999997, "r_x3": 346.88931, "r_y3": 87.16332999999997, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 108.0249, "r_x1": 492.96097, "r_y1": 108.0249, "r_x2": 492.96097, "r_y2": 99.11835000000008, "r_x3": 308.86206, "r_y3": 99.11835000000008, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86206, "t": 116.22937000000002, "r": 545.1153, "b": 328.37405, "coord_origin": "TOPLEFT" }, "confidence": 0.9880930781364441, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 125.13593000000003, "r_x1": 545.11499, "r_y1": 125.13593000000003, "r_x2": 545.11499, "r_y2": 116.22937000000002, "r_x3": 320.81705, "r_y3": 116.22937000000002, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 137.09094000000005, "r_x1": 545.11517, "r_y1": 137.09094000000005, "r_x2": 545.11517, "r_y2": 128.18439, "r_x3": 308.86206, "r_y3": 128.18439, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 149.04596000000004, "r_x1": 545.11505, "r_y1": 149.04596000000004, "r_x2": 545.11505, "r_y2": 140.13940000000002, "r_x3": 308.86206, "r_y3": 140.13940000000002, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 161.00098000000003, "r_x1": 545.11511, "r_y1": 161.00098000000003, "r_x2": 545.11511, "r_y2": 152.09442, "r_x3": 308.86206, "r_y3": 152.09442, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 172.95599000000004, "r_x1": 545.11517, "r_y1": 172.95599000000004, "r_x2": 545.11517, "r_y2": 164.04944, "r_x3": 308.86206, "r_y3": 164.04944, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 184.91198999999995, "r_x1": 467.21756000000005, "r_y1": 184.91198999999995, "r_x2": 467.21756000000005, "r_y2": 176.00543000000005, "r_x3": 308.86206, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.43671, "r_y0": 184.91198999999995, "r_x1": 545.11511, "r_y1": 184.91198999999995, "r_x2": 545.11511, "r_y2": 176.00543000000005, "r_x3": 475.43671, "r_y3": 176.00543000000005, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 196.86699999999996, "r_x1": 545.11511, "r_y1": 196.86699999999996, "r_x2": 545.11511, "r_y2": 187.96045000000004, "r_x3": 308.86206, "r_y3": 187.96045000000004, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 208.82201999999995, "r_x1": 545.11511, "r_y1": 208.82201999999995, "r_x2": 545.11511, "r_y2": 199.91547000000003, "r_x3": 308.86206, "r_y3": 199.91547000000003, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 220.77704000000006, "r_x1": 545.11517, "r_y1": 220.77704000000006, "r_x2": 545.11517, "r_y2": 211.87048000000004, "r_x3": 308.86206, "r_y3": 211.87048000000004, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 232.73206000000005, "r_x1": 545.11511, "r_y1": 232.73206000000005, "r_x2": 545.11511, "r_y2": 223.82550000000003, "r_x3": 308.86206, "r_y3": 223.82550000000003, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 244.68706999999995, "r_x1": 545.11511, "r_y1": 244.68706999999995, "r_x2": 545.11511, "r_y2": 235.78052000000002, "r_x3": 308.86206, "r_y3": 235.78052000000002, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 256.64306999999997, "r_x1": 545.11523, "r_y1": 256.64306999999997, "r_x2": 545.11523, "r_y2": 247.73650999999995, "r_x3": 308.86206, "r_y3": 247.73650999999995, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 268.59808, "r_x1": 342.3364, "r_y1": 268.59808, "r_x2": 342.3364, "r_y2": 259.69152999999994, "r_x3": 308.86206, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95157, "r_y0": 268.59808, "r_x1": 545.11517, "r_y1": 268.59808, "r_x2": 545.11517, "r_y2": 259.69152999999994, "r_x3": 348.95157, "r_y3": 259.69152999999994, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 280.55310000000003, "r_x1": 545.11517, "r_y1": 280.55310000000003, "r_x2": 545.11517, "r_y2": 271.64655000000005, "r_x3": 308.86206, "r_y3": 271.64655000000005, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 292.50809, "r_x1": 545.1153, "r_y1": 292.50809, "r_x2": 545.1153, "r_y2": 283.6015300000001, "r_x3": 308.86206, "r_y3": 283.6015300000001, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 304.46307, "r_x1": 545.11511, "r_y1": 304.46307, "r_x2": 545.11511, "r_y2": 295.55652, "r_x3": 308.86206, "r_y3": 295.55652, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 316.41806, "r_x1": 545.11511, "r_y1": 316.41806, "r_x2": 545.11511, "r_y2": 307.51151, "r_x3": 308.86206, "r_y3": 307.51151, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 328.37405, "r_x1": 532.48267, "r_y1": 328.37405, "r_x2": 532.48267, "r_y2": 319.4674999999999, "r_x3": 308.86206, "r_y3": 319.4674999999999, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5." }, { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86203, "t": 336.57751, "r": 545.11517, "b": 429.16998, "coord_origin": "TOPLEFT" }, "confidence": 0.9877589344978333, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 345.48407000000003, "r_x1": 545.11499, "r_y1": 345.48407000000003, "r_x2": 545.11499, "r_y2": 336.57751, "r_x3": 320.81705, "r_y3": 336.57751, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 357.43906, "r_x1": 403.7359, "r_y1": 357.43906, "r_x2": 403.7359, "r_y2": 348.5325000000001, "r_x3": 308.86206, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.07605, "r_y0": 357.20993, "r_x1": 503.54016, "r_y1": 357.20993, "r_x2": 503.54016, "r_y2": 348.62216, "r_x3": 406.07605, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.53906, "r_y0": 357.43906, "r_x1": 506.02972, "r_y1": 357.43906, "r_x2": 506.02972, "r_y2": 348.5325000000001, "r_x3": 503.53906, "r_y3": 348.5325000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.40004999999996, "r_y0": 357.20993, "r_x1": 545.11224, "r_y1": 357.20993, "r_x2": 545.11224, "r_y2": 348.62216, "r_x3": 508.40004999999996, "r_y3": 348.62216, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 369.16492000000005, "r_x1": 343.1633, "r_y1": 369.16492000000005, "r_x2": 343.1633, "r_y2": 360.57715, "r_x3": 308.86206, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16306, "r_y0": 369.39404, "r_x1": 362.2016, "r_y1": 369.39404, "r_x2": 362.2016, "r_y2": 360.48749, "r_x3": 343.16306, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.28604, "r_y0": 369.16492000000005, "r_x1": 440.93829, "r_y1": 369.16492000000005, "r_x2": 440.93829, "r_y2": 360.57715, "r_x3": 364.28604, "r_y3": 360.57715, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.93903, "r_y0": 369.39404, "r_x1": 545.10797, "r_y1": 369.39404, "r_x2": 545.10797, "r_y2": 360.48749, "r_x3": 440.93903, "r_y3": 360.48749, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 381.34903, "r_x1": 545.11511, "r_y1": 381.34903, "r_x2": 545.11511, "r_y2": 372.44247, "r_x3": 308.86203, "r_y3": 372.44247, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 393.30502, "r_x1": 545.11517, "r_y1": 393.30502, "r_x2": 545.11517, "r_y2": 384.3984699999999, "r_x3": 308.86203, "r_y3": 384.3984699999999, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 405.04083, "r_x1": 314.67322, "r_y1": 405.04083, "r_x2": 314.67322, "r_y2": 396.19406000000004, "r_x3": 308.86203, "r_y3": 396.19406000000004, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.65802, "r_y0": 405.2600100000001, "r_x1": 360.39139, "r_y1": 405.2600100000001, "r_x2": 360.39139, "r_y2": 396.35345, "r_x3": 318.65802, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96295, "r_y0": 405.2600100000001, "r_x1": 545.10803, "r_y1": 405.2600100000001, "r_x2": 545.10803, "r_y2": 396.35345, "r_x3": 367.96295, "r_y3": 396.35345, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 417.215, "r_x1": 545.11511, "r_y1": 417.215, "r_x2": 545.11511, "r_y2": 408.30844, "r_x3": 308.86203, "r_y3": 408.30844, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 429.16998, "r_x1": 360.9664, "r_y1": 429.16998, "r_x2": 360.9664, "r_y2": 420.26343, "r_x3": 308.86203, "r_y3": 420.26343, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence." }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86203, "t": 437.37441999999993, "r": 545.11523, "b": 553.87689, "coord_origin": "TOPLEFT" }, "confidence": 0.9884491562843323, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 446.28098, "r_x1": 545.11499, "r_y1": 446.28098, "r_x2": 545.11499, "r_y2": 437.37441999999993, "r_x3": 320.81702, "r_y3": 437.37441999999993, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 458.23596, "r_x1": 384.62759, "r_y1": 458.23596, "r_x2": 384.62759, "r_y2": 449.32941, "r_x3": 308.86203, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37228, "r_y0": 458.23596, "r_x1": 545.11511, "r_y1": 458.23596, "r_x2": 545.11511, "r_y2": 449.32941, "r_x3": 391.37228, "r_y3": 449.32941, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 470.19095, "r_x1": 494.00693000000007, "r_y1": 470.19095, "r_x2": 494.00693000000007, "r_y2": 461.28439, "r_x3": 308.86203, "r_y3": 461.28439, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.07803, "r_y0": 469.96182, "r_x1": 545.11145, "r_y1": 469.96182, "r_x2": 545.11145, "r_y2": 461.37405, "r_x3": 498.07803, "r_y3": 461.37405, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 481.91681, "r_x1": 364.44336, "r_y1": 481.91681, "r_x2": 364.44336, "r_y2": 473.32904, "r_x3": 308.86203, "r_y3": 473.32904, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06104, "r_y0": 482.14594, "r_x1": 545.11267, "r_y1": 482.14594, "r_x2": 545.11267, "r_y2": 473.23938, "r_x3": 367.06104, "r_y3": 473.23938, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 494.10092, "r_x1": 545.11511, "r_y1": 494.10092, "r_x2": 545.11511, "r_y2": 485.19437, "r_x3": 308.86203, "r_y3": 485.19437, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 506.05591, "r_x1": 545.11523, "r_y1": 506.05591, "r_x2": 545.11523, "r_y2": 497.14935, "r_x3": 308.86203, "r_y3": 497.14935, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 518.0119, "r_x1": 545.11511, "r_y1": 518.0119, "r_x2": 545.11511, "r_y2": 509.10535, "r_x3": 308.86203, "r_y3": 509.10535, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 529.9668899999999, "r_x1": 545.11517, "r_y1": 529.9668899999999, "r_x2": 545.11517, "r_y2": 521.06033, "r_x3": 308.86203, "r_y3": 521.06033, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 541.9218900000001, "r_x1": 545.11517, "r_y1": 541.9218900000001, "r_x2": 545.11517, "r_y2": 533.01532, "r_x3": 308.86203, "r_y3": 533.01532, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 553.87689, "r_x1": 377.21548, "r_y1": 553.87689, "r_x2": 377.21548, "r_y2": 544.97034, "r_x3": 308.86203, "r_y3": 544.97034, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag." }, { "label": "section_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 308.86203, "t": 579.55432, "r": 397.44281, "b": 589.40637, "coord_origin": "TOPLEFT" }, "confidence": 0.9450808763504028, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 589.40637, "r_x1": 323.9046, "r_y1": 589.40637, "r_x2": 323.9046, "r_y2": 579.55432, "r_x3": 308.86203, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93301, "r_y0": 589.40637, "r_x1": 397.44281, "r_y1": 589.40637, "r_x2": 397.44281, "r_y2": 579.55432, "r_x3": 333.93301, "r_y3": 579.55432, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2. Generalization" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86203, "t": 603.44933, "r": 545.11517, "b": 672.13189, "coord_origin": "TOPLEFT" }, "confidence": 0.9880595803260803, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 612.3558800000001, "r_x1": 545.11493, "r_y1": 612.3558800000001, "r_x2": 545.11493, "r_y2": 603.44933, "r_x3": 320.81702, "r_y3": 603.44933, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 624.31088, "r_x1": 545.11511, "r_y1": 624.31088, "r_x2": 545.11511, "r_y2": 615.40433, "r_x3": 308.86203, "r_y3": 615.40433, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 636.26588, "r_x1": 545.11517, "r_y1": 636.26588, "r_x2": 545.11517, "r_y2": 627.35933, "r_x3": 308.86203, "r_y3": 627.35933, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 648.22089, "r_x1": 545.11511, "r_y1": 648.22089, "r_x2": 545.11511, "r_y2": 639.31433, "r_x3": 308.86203, "r_y3": 639.31433, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 660.17688, "r_x1": 545.11517, "r_y1": 660.17688, "r_x2": 545.11517, "r_y2": 651.27032, "r_x3": 308.86203, "r_y3": 651.27032, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 672.13189, "r_x1": 350.70493, "r_y1": 672.13189, "r_x2": 350.70493, "r_y2": 663.22533, "r_x3": 308.86203, "r_y3": 663.22533, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively." }, { "label": "text", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.86203, "t": 680.33533, "r": 545.11523, "b": 713.152893, "coord_origin": "TOPLEFT" }, "confidence": 0.9830910563468933, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 689.24189, "r_x1": 545.11505, "r_y1": 689.24189, "r_x2": 545.11505, "r_y2": 680.33533, "r_x3": 320.81702, "r_y3": 680.33533, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 701.196892, "r_x1": 396.21411, "r_y1": 701.196892, "r_x2": 396.21411, "r_y2": 692.290329, "r_x3": 308.86203, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.40585, "r_y0": 701.196892, "r_x1": 545.11523, "r_y1": 701.196892, "r_x2": 545.11523, "r_y2": 692.290329, "r_x3": 406.40585, "r_y3": 692.290329, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 713.152893, "r_x1": 495.93982, "r_y1": 713.152893, "r_x2": 495.93982, "r_y2": 704.246323, "r_x3": 308.86203, "r_y3": 704.246323, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized." } ], "headers": [ { "label": "page_footer", "id": 17, "page_no": 5, "cluster": { "id": 17, "label": "page_footer", "bbox": { "l": 295.12103, "t": 734.133327, "r": 300.10233, "b": 743.03989, "coord_origin": "TOPLEFT" }, "confidence": 0.8820409178733826, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.03989, "r_x1": 300.10233, "r_y1": 743.03989, "r_x2": 300.10233, "r_y2": 734.133327, "r_x3": 295.12103, "r_y3": 734.133327, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" } ] } }, { "page_no": 6, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.25342, "r_x1": 63.704811, "r_y1": 84.25342, "r_x2": 63.704811, "r_y2": 74.40137000000016, "r_x3": 50.112, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.766685, "r_y0": 84.25342, "r_x1": 167.89825, "r_y1": 84.25342, "r_x2": 167.89825, "r_y2": 74.40137000000016, "r_x3": 72.766685, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 102.25696000000016, "r_x1": 286.36499, "r_y1": 102.25696000000016, "r_x2": 286.36499, "r_y2": 93.35039999999992, "r_x3": 62.067001, "r_y3": 93.35039999999992, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 114.21198000000015, "r_x1": 286.36511, "r_y1": 114.21198000000015, "r_x2": 286.36511, "r_y2": 105.30542000000003, "r_x3": 50.112, "r_y3": 105.30542000000003, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 126.16699000000006, "r_x1": 286.36505, "r_y1": 126.16699000000006, "r_x2": 286.36505, "r_y2": 117.26044000000002, "r_x3": 50.112, "r_y3": 117.26044000000002, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 138.12298999999996, "r_x1": 136.71687, "r_y1": 138.12298999999996, "r_x2": 136.71687, "r_y2": 129.21642999999995, "r_x3": 50.112, "r_y3": 129.21642999999995, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.218994, "r_y0": 165.90479000000005, "r_x1": 118.8784, "r_y1": 165.90479000000005, "r_x2": 118.8784, "r_y2": 157.05798000000004, "r_x3": 86.218994, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87499, "r_y0": 165.90479000000005, "r_x1": 143.26962, "r_y1": 165.90479000000005, "r_x2": 143.26962, "r_y2": 157.05798000000004, "r_x3": 118.87499, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.76799, "r_y0": 165.90479000000005, "r_x1": 165.9019, "r_y1": 165.90479000000005, "r_x2": 165.9019, "r_y2": 157.05798000000004, "r_x3": 143.76799, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12099, "r_y0": 165.90479000000005, "r_x1": 175.8699, "r_y1": 165.90479000000005, "r_x2": 175.8699, "r_y2": 156.50012000000004, "r_x3": 168.12099, "r_y3": 156.50012000000004, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.27899, "r_y0": 159.16479000000004, "r_x1": 221.95677, "r_y1": 159.16479000000004, "r_x2": 221.95677, "r_y2": 150.31799, "r_x3": 179.27899, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95200000000003, "r_y0": 159.16479000000004, "r_x1": 246.34663, "r_y1": 159.16479000000004, "r_x2": 246.34663, "r_y2": 150.31799, "r_x3": 221.95200000000003, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84499999999997, "r_y0": 159.16479000000004, "r_x1": 250.71945, "r_y1": 159.16479000000004, "r_x2": 250.71945, "r_y2": 150.31799, "r_x3": 246.84499999999997, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21201, "r_y0": 172.73877000000005, "r_x1": 206.29161, "r_y1": 172.73877000000005, "r_x2": 206.29161, "r_y2": 163.89197000000001, "r_x3": 182.21201, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.289, "r_y0": 172.73877000000005, "r_x1": 209.05661, "r_y1": 172.73877000000005, "r_x2": 209.05661, "r_y2": 163.33411, "r_x3": 206.289, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.056, "r_y0": 172.73877000000005, "r_x1": 219.19968, "r_y1": 172.73877000000005, "r_x2": 219.19968, "r_y2": 163.89197000000001, "r_x3": 209.056, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.69700999999998, "r_y0": 172.73877000000005, "r_x1": 222.46461000000002, "r_y1": 172.73877000000005, "r_x2": 222.46461000000002, "r_y2": 163.33411, "r_x3": 219.69700999999998, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.125, "r_y0": 172.73877000000005, "r_x1": 226.89261, "r_y1": 172.73877000000005, "r_x2": 226.89261, "r_y2": 163.89197000000001, "r_x3": 224.125, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55299000000002, "r_y0": 172.73877000000005, "r_x1": 231.3206, "r_y1": 172.73877000000005, "r_x2": 231.3206, "r_y2": 163.33411, "r_x3": 228.55299000000002, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.31999, "r_y0": 172.73877000000005, "r_x1": 240.64563, "r_y1": 172.73877000000005, "r_x2": 240.64563, "r_y2": 163.89197000000001, "r_x3": 231.31999, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.144, "r_y0": 172.73877000000005, "r_x1": 243.91161, "r_y1": 172.73877000000005, "r_x2": 243.91161, "r_y2": 163.33411, "r_x3": 241.144, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.911, "r_y0": 172.73877000000005, "r_x1": 247.78545, "r_y1": 172.73877000000005, "r_x2": 247.78545, "r_y2": 163.89197000000001, "r_x3": 243.911, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 166.12396, "r_x1": 286.3624, "r_y1": 166.12396, "r_x2": 286.3624, "r_y2": 157.21740999999997, "r_x3": 274.746, "r_y3": 157.21740999999997, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 190.06897000000004, "r_x1": 86.405632, "r_y1": 190.06897000000004, "r_x2": 86.405632, "r_y2": 181.16241000000002, "r_x3": 62.067001, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.581001, "r_y0": 189.84978999999998, "r_x1": 98.724663, "r_y1": 189.84978999999998, "r_x2": 98.724663, "r_y2": 181.00298999999995, "r_x3": 88.581001, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.399, "r_y0": 190.06897000000004, "r_x1": 115.785, "r_y1": 190.06897000000004, "r_x2": 115.785, "r_y2": 181.16241000000002, "r_x3": 101.399, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.961, "r_y0": 189.84978999999998, "r_x1": 127.28664, "r_y1": 189.84978999999998, "r_x2": 127.28664, "r_y2": 181.00298999999995, "r_x3": 117.961, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.95999, "r_y0": 190.06897000000004, "r_x1": 286.36285, "r_y1": 190.06897000000004, "r_x2": 286.36285, "r_y2": 181.16241000000002, "r_x3": 129.95999, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 202.02399000000003, "r_x1": 252.78116000000003, "r_y1": 202.02399000000003, "r_x2": 252.78116000000003, "r_y2": 193.11743, "r_x3": 50.111992, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18201, "r_y0": 201.80480999999997, "r_x1": 257.94962, "r_y1": 201.80480999999997, "r_x2": 257.94962, "r_y2": 192.40015000000005, "r_x3": 255.18201, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.94901, "r_y0": 201.80480999999997, "r_x1": 263.77115, "r_y1": 201.80480999999997, "r_x2": 263.77115, "r_y2": 192.95800999999994, "r_x3": 257.94901, "r_y3": 192.95800999999994, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.155, "r_y0": 201.80480999999997, "r_x1": 267.92261, "r_y1": 201.80480999999997, "r_x2": 267.92261, "r_y2": 192.40015000000005, "r_x3": 265.155, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32199, "r_y0": 202.02399000000003, "r_x1": 286.36179, "r_y1": 202.02399000000003, "r_x2": 286.36179, "r_y2": 193.11743, "r_x3": 270.32199, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 213.97900000000004, "r_x1": 172.13388, "r_y1": 213.97900000000004, "r_x2": 172.13388, "r_y2": 205.07245, "r_x3": 50.111984, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62399, "r_y0": 213.75982999999997, "r_x1": 180.44614, "r_y1": 213.75982999999997, "r_x2": 180.44614, "r_y2": 204.91301999999996, "r_x3": 174.62399, "r_y3": 204.91301999999996, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.82899, "r_y0": 213.97900000000004, "r_x1": 184.31964, "r_y1": 213.97900000000004, "r_x2": 184.31964, "r_y2": 205.07245, "r_x3": 181.82899, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 234.67151, "r_x1": 64.551605, "r_y1": 234.67151, "r_x2": 64.551605, "r_y2": 224.81946000000005, "r_x3": 50.112, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.178009, "r_y0": 234.67151, "r_x1": 170.45169, "r_y1": 234.67151, "r_x2": 170.45169, "r_y2": 224.81946000000005, "r_x3": 74.178009, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.60626000000002, "r_x1": 105.32461, "r_y1": 252.60626000000002, "r_x2": 105.32461, "r_y2": 243.6499, "r_x3": 62.067001, "r_y3": 243.6499, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.12600000000002, "r_y0": 252.67602999999997, "r_x1": 184.68361, "r_y1": 252.67602999999997, "r_x2": 184.68361, "r_y2": 243.76946999999996, "r_x3": 112.12600000000002, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.4781, "r_y0": 252.67602999999997, "r_x1": 286.36188, "r_y1": 252.67602999999997, "r_x2": 286.36188, "r_y2": 243.76946999999996, "r_x3": 191.4781, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.63104, "r_x1": 286.36508, "r_y1": 264.63104, "r_x2": 286.36508, "r_y2": 255.72448999999995, "r_x3": 50.112, "r_y3": 255.72448999999995, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.58606, "r_x1": 286.36508, "r_y1": 276.58606, "r_x2": 286.36508, "r_y2": 267.67949999999996, "r_x3": 50.112, "r_y3": 267.67949999999996, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.54105, "r_x1": 286.36508, "r_y1": 288.54105, "r_x2": 286.36508, "r_y2": 279.63446, "r_x3": 50.112, "r_y3": 279.63446, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.49704, "r_x1": 286.36514, "r_y1": 300.49704, "r_x2": 286.36514, "r_y2": 291.59048, "r_x3": 50.112, "r_y3": 291.59048, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.45203000000004, "r_x1": 286.36508, "r_y1": 312.45203000000004, "r_x2": 286.36508, "r_y2": 303.54547, "r_x3": 50.112, "r_y3": 303.54547, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.40700999999996, "r_x1": 286.36505, "r_y1": 324.40700999999996, "r_x2": 286.36505, "r_y2": 315.50046, "r_x3": 50.112, "r_y3": 315.50046, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.362, "r_x1": 286.36508, "r_y1": 336.362, "r_x2": 286.36508, "r_y2": 327.45544, "r_x3": 50.112, "r_y3": 327.45544, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.31699000000003, "r_x1": 286.36508, "r_y1": 348.31699000000003, "r_x2": 286.36508, "r_y2": 339.41043, "r_x3": 50.112, "r_y3": 339.41043, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 360.27197, "r_x1": 286.36505, "r_y1": 360.27197, "r_x2": 286.36505, "r_y2": 351.36542, "r_x3": 50.112, "r_y3": 351.36542, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 372.2279700000001, "r_x1": 286.36508, "r_y1": 372.2279700000001, "r_x2": 286.36508, "r_y2": 363.32141, "r_x3": 50.112, "r_y3": 363.32141, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 384.18295000000006, "r_x1": 286.36511, "r_y1": 384.18295000000006, "r_x2": 286.36511, "r_y2": 375.2764, "r_x3": 50.112, "r_y3": 375.2764, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.13794, "r_x1": 170.01187, "r_y1": 396.13794, "r_x2": 170.01187, "r_y2": 387.23138, "r_x3": 50.112, "r_y3": 387.23138, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 601.33992, "r_x1": 286.36511, "r_y1": 601.33992, "r_x2": 286.36511, "r_y2": 592.43336, "r_x3": 50.112, "r_y3": 592.43336, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 613.29492, "r_x1": 247.46114, "r_y1": 613.29492, "r_x2": 247.46114, "r_y2": 604.38837, "r_x3": 50.112, "r_y3": 604.38837, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 625.24992, "r_x1": 261.78732, "r_y1": 625.24992, "r_x2": 261.78732, "r_y2": 616.34337, "r_x3": 50.112, "r_y3": 616.34337, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 653.30618, "r_x1": 124.72179, "r_y1": 653.30618, "r_x2": 124.72179, "r_y2": 644.3498099999999, "r_x3": 62.067001, "r_y3": 644.3498099999999, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.20401, "r_y0": 653.37592, "r_x1": 242.9333, "r_y1": 653.37592, "r_x2": 242.9333, "r_y2": 644.46936, "r_x3": 128.20401, "r_y3": 644.46936, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55401999999998, "r_y0": 653.1467700000001, "r_x1": 286.36084, "r_y1": 653.1467700000001, "r_x2": 286.36084, "r_y2": 644.55902, "r_x3": 245.55401999999998, "r_y3": 644.55902, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.10178, "r_x1": 84.971146, "r_y1": 665.10178, "r_x2": 84.971146, "r_y2": 656.51402, "r_x3": 50.112015, "r_y3": 656.51402, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.515015, "r_y0": 665.33092, "r_x1": 286.366, "r_y1": 665.33092, "r_x2": 286.366, "r_y2": 656.42436, "r_x3": 89.515015, "r_y3": 656.42436, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28593, "r_x1": 286.36511, "r_y1": 677.28593, "r_x2": 286.36511, "r_y2": 668.37936, "r_x3": 50.112015, "r_y3": 668.37936, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24193, "r_x1": 286.36505, "r_y1": 689.24193, "r_x2": 286.36505, "r_y2": 680.33536, "r_x3": 50.112015, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.19693, "r_x1": 286.36511, "r_y1": 701.19693, "r_x2": 286.36511, "r_y2": 692.290359, "r_x3": 50.112015, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151932, "r_x1": 286.36508, "r_y1": 713.151932, "r_x2": 286.36508, "r_y2": 704.245361, "r_x3": 50.112015, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 322.14215, "r_y1": 84.11492999999996, "r_x2": 322.14215, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45401, "r_y0": 83.88580000000002, "r_x1": 404.56702, "r_y1": 83.88580000000002, "r_x2": 404.56702, "r_y2": 75.29803000000004, "r_x3": 325.45401, "r_y3": 75.29803000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.104, "r_y0": 84.11492999999996, "r_x1": 545.10968, "r_y1": 84.11492999999996, "r_x2": 545.10968, "r_y2": 75.20836999999995, "r_x3": 408.104, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11511, "r_y1": 96.06994999999995, "r_x2": 545.11511, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 470.22626, "r_y1": 108.02495999999985, "r_x2": 470.22626, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.52884, "r_y0": 108.02495999999985, "r_x1": 545.11511, "r_y1": 108.02495999999985, "r_x2": 545.11511, "r_y2": 99.11841000000004, "r_x3": 477.52884, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 119.97997999999984, "r_x1": 545.11517, "r_y1": 119.97997999999984, "r_x2": 545.11517, "r_y2": 111.07343000000003, "r_x3": 308.862, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 131.93499999999995, "r_x1": 545.11511, "r_y1": 131.93499999999995, "r_x2": 545.11511, "r_y2": 123.02844000000005, "r_x3": 308.862, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 143.89099, "r_x1": 502.01691000000005, "r_y1": 143.89099, "r_x2": 502.01691000000005, "r_y2": 134.98443999999995, "r_x3": 308.862, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47299, "r_y0": 143.66187000000002, "r_x1": 545.11041, "r_y1": 143.66187000000002, "r_x2": 545.11041, "r_y2": 135.07410000000004, "r_x3": 504.47299, "r_y3": 135.07410000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 155.61688000000004, "r_x1": 343.16324, "r_y1": 155.61688000000004, "r_x2": 343.16324, "r_y2": 147.02910999999995, "r_x3": 308.862, "r_y3": 147.02910999999995, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.371, "r_y0": 155.84600999999998, "r_x1": 545.11493, "r_y1": 155.84600999999998, "r_x2": 545.11493, "r_y2": 146.93944999999997, "r_x3": 346.371, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 167.80102999999997, "r_x1": 446.15652, "r_y1": 167.80102999999997, "r_x2": 446.15652, "r_y2": 158.89446999999996, "r_x3": 308.862, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.28998000000007, "r_y0": 167.57190000000003, "r_x1": 525.04181, "r_y1": 167.57190000000003, "r_x2": 525.04181, "r_y2": 158.98413000000005, "r_x3": 448.28998000000007, "r_y3": 158.98413000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.39899, "r_y0": 167.80102999999997, "r_x1": 545.11249, "r_y1": 167.80102999999997, "r_x2": 545.11249, "r_y2": 158.89446999999996, "r_x3": 527.39899, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 179.75603999999998, "r_x1": 545.11511, "r_y1": 179.75603999999998, "r_x2": 545.11511, "r_y2": 170.84948999999995, "r_x3": 308.862, "r_y3": 170.84948999999995, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 191.71105999999997, "r_x1": 432.86642000000006, "r_y1": 191.71105999999997, "r_x2": 432.86642000000006, "r_y2": 182.80449999999996, "r_x3": 308.862, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39001, "r_y0": 191.48193000000003, "r_x1": 510.93021, "r_y1": 191.48193000000003, "r_x2": 510.93021, "r_y2": 182.89417000000003, "r_x3": 436.39001, "r_y3": 182.89417000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.677, "r_y0": 191.71105999999997, "r_x1": 545.11273, "r_y1": 191.71105999999997, "r_x2": 545.11273, "r_y2": 182.80449999999996, "r_x3": 514.677, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 203.66607999999997, "r_x1": 431.17285, "r_y1": 203.66607999999997, "r_x2": 431.17285, "r_y2": 194.75951999999995, "r_x3": 308.862, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6790199999999, "r_y0": 203.43695000000002, "r_x1": 514.18054, "r_y1": 203.43695000000002, "r_x2": 514.18054, "r_y2": 194.84918000000005, "r_x3": 434.6790199999999, "r_y3": 194.84918000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.17603, "r_y0": 203.66607999999997, "r_x1": 545.10992, "r_y1": 203.66607999999997, "r_x2": 545.10992, "r_y2": 194.75951999999995, "r_x3": 514.17603, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 215.39293999999995, "r_x1": 382.35614, "r_y1": 215.39293999999995, "r_x2": 382.35614, "r_y2": 206.80517999999995, "r_x3": 308.86203, "r_y3": 206.80517999999995, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.07501, "r_y0": 215.62207, "r_x1": 545.11426, "r_y1": 215.62207, "r_x2": 545.11426, "r_y2": 206.71551999999997, "r_x3": 385.07501, "r_y3": 206.71551999999997, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 227.57709, "r_x1": 501.6981799999999, "r_y1": 227.57709, "r_x2": 501.6981799999999, "r_y2": 218.67052999999999, "r_x3": 308.862, "r_y3": 218.67052999999999, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 325.35587, "r_x1": 341.49951, "r_y1": 325.35587, "r_x2": 341.49951, "r_y2": 316.44931, "r_x3": 308.862, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.60284, "r_y0": 325.35587, "r_x1": 545.11517, "r_y1": 325.35587, "r_x2": 545.11517, "r_y2": 316.44931, "r_x3": 348.60284, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.3108500000001, "r_x1": 474.97845, "r_y1": 337.3108500000001, "r_x2": 474.97845, "r_y2": 328.4043, "r_x3": 308.862, "r_y3": 328.4043, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 376.63611, "r_x1": 378.94876, "r_y1": 376.63611, "r_x2": 378.94876, "r_y2": 367.6797199999999, "r_x3": 320.81699, "r_y3": 367.6797199999999, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.07898, "r_y0": 376.70584, "r_x1": 545.11566, "r_y1": 376.70584, "r_x2": 545.11566, "r_y2": 367.79929, "r_x3": 387.07898, "r_y3": 367.79929, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 388.66083, "r_x1": 487.19257, "r_y1": 388.66083, "r_x2": 487.19257, "r_y2": 379.75426999999996, "r_x3": 308.86197, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.96713, "r_y0": 388.66083, "r_x1": 545.11511, "r_y1": 388.66083, "r_x2": 545.11511, "r_y2": 379.75426999999996, "r_x3": 493.96713, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 400.61581, "r_x1": 545.11505, "r_y1": 400.61581, "r_x2": 545.11505, "r_y2": 391.70926, "r_x3": 308.86197, "r_y3": 391.70926, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 412.57181, "r_x1": 545.11523, "r_y1": 412.57181, "r_x2": 545.11523, "r_y2": 403.66525, "r_x3": 308.86197, "r_y3": 403.66525, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 424.52679, "r_x1": 314.08096, "r_y1": 424.52679, "r_x2": 314.08096, "r_y2": 415.62024, "r_x3": 308.86197, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69046, "r_y0": 424.52679, "r_x1": 545.11517, "r_y1": 424.52679, "r_x2": 545.11517, "r_y2": 415.62024, "r_x3": 316.69046, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 436.48177999999996, "r_x1": 545.11505, "r_y1": 436.48177999999996, "r_x2": 545.11505, "r_y2": 427.57523, "r_x3": 308.86197, "r_y3": 427.57523, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 448.43677, "r_x1": 545.11505, "r_y1": 448.43677, "r_x2": 545.11505, "r_y2": 439.53021, "r_x3": 308.86197, "r_y3": 439.53021, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 460.39175, "r_x1": 350.23666, "r_y1": 460.39175, "r_x2": 350.23666, "r_y2": 451.4852, "r_x3": 308.86197, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.17596, "r_y0": 460.32201999999995, "r_x1": 374.59183, "r_y1": 460.32201999999995, "r_x2": 374.59183, "r_y2": 451.36563, "r_x3": 352.17596, "r_y3": 451.36563, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53296, "r_y0": 460.39175, "r_x1": 545.11011, "r_y1": 460.39175, "r_x2": 545.11011, "r_y2": 451.4852, "r_x3": 376.53296, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 472.34674, "r_x1": 545.11511, "r_y1": 472.34674, "r_x2": 545.11511, "r_y2": 463.44019, "r_x3": 308.86197, "r_y3": 463.44019, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 484.30273, "r_x1": 545.11517, "r_y1": 484.30273, "r_x2": 545.11517, "r_y2": 475.39618, "r_x3": 308.86197, "r_y3": 475.39618, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 496.25772, "r_x1": 545.11511, "r_y1": 496.25772, "r_x2": 545.11511, "r_y2": 487.35117, "r_x3": 308.86197, "r_y3": 487.35117, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 508.21271, "r_x1": 545.11505, "r_y1": 508.21271, "r_x2": 545.11505, "r_y2": 499.30615, "r_x3": 308.86197, "r_y3": 499.30615, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 520.16769, "r_x1": 405.69846, "r_y1": 520.16769, "r_x2": 405.69846, "r_y2": 511.26114, "r_x3": 308.86197, "r_y3": 511.26114, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.76792, "r_x1": 341.73862, "r_y1": 665.76792, "r_x2": 341.73862, "r_y2": 656.86136, "r_x3": 308.862, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.55927, "r_y0": 665.76792, "r_x1": 545.11517, "r_y1": 665.76792, "r_x2": 545.11517, "r_y2": 656.86136, "r_x3": 349.55927, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.7229199999999, "r_x1": 545.11505, "r_y1": 677.7229199999999, "r_x2": 545.11505, "r_y2": 668.81636, "r_x3": 308.862, "r_y3": 668.81636, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.6779300000001, "r_x1": 435.03836, "r_y1": 689.6779300000001, "r_x2": 435.03836, "r_y2": 680.77136, "r_x3": 308.862, "r_y3": 680.77136, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039921, "r_x1": 300.10229, "r_y1": 743.039921, "r_x2": 300.10229, "r_y2": 734.133358, "r_x3": 295.121, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "section_header", "bbox": { "l": 50.112, "t": 74.40137000000016, "r": 167.89825, "b": 84.25342, "coord_origin": "TOPLEFT" }, "confidence": 0.9554274082183838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.25342, "r_x1": 63.704811, "r_y1": 84.25342, "r_x2": 63.704811, "r_y2": 74.40137000000016, "r_x3": 50.112, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.766685, "r_y0": 84.25342, "r_x1": 167.89825, "r_y1": 84.25342, "r_x2": 167.89825, "r_y2": 74.40137000000016, "r_x3": 72.766685, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 93.35039999999992, "r": 286.36511, "b": 138.12298999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9862998127937317, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 102.25696000000016, "r_x1": 286.36499, "r_y1": 102.25696000000016, "r_x2": 286.36499, "r_y2": 93.35039999999992, "r_x3": 62.067001, "r_y3": 93.35039999999992, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 114.21198000000015, "r_x1": 286.36511, "r_y1": 114.21198000000015, "r_x2": 286.36511, "r_y2": 105.30542000000003, "r_x3": 50.112, "r_y3": 105.30542000000003, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 126.16699000000006, "r_x1": 286.36505, "r_y1": 126.16699000000006, "r_x2": 286.36505, "r_y2": 117.26044000000002, "r_x3": 50.112, "r_y3": 117.26044000000002, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 138.12298999999996, "r_x1": 136.71687, "r_y1": 138.12298999999996, "r_x2": 136.71687, "r_y2": 129.21642999999995, "r_x3": 50.112, "r_y3": 129.21642999999995, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "formula", "bbox": { "l": 86.218994, "t": 150.31799, "r": 286.3624, "b": 172.73877000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9500409364700317, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.218994, "r_y0": 165.90479000000005, "r_x1": 118.8784, "r_y1": 165.90479000000005, "r_x2": 118.8784, "r_y2": 157.05798000000004, "r_x3": 86.218994, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87499, "r_y0": 165.90479000000005, "r_x1": 143.26962, "r_y1": 165.90479000000005, "r_x2": 143.26962, "r_y2": 157.05798000000004, "r_x3": 118.87499, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.76799, "r_y0": 165.90479000000005, "r_x1": 165.9019, "r_y1": 165.90479000000005, "r_x2": 165.9019, "r_y2": 157.05798000000004, "r_x3": 143.76799, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12099, "r_y0": 165.90479000000005, "r_x1": 175.8699, "r_y1": 165.90479000000005, "r_x2": 175.8699, "r_y2": 156.50012000000004, "r_x3": 168.12099, "r_y3": 156.50012000000004, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.27899, "r_y0": 159.16479000000004, "r_x1": 221.95677, "r_y1": 159.16479000000004, "r_x2": 221.95677, "r_y2": 150.31799, "r_x3": 179.27899, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95200000000003, "r_y0": 159.16479000000004, "r_x1": 246.34663, "r_y1": 159.16479000000004, "r_x2": 246.34663, "r_y2": 150.31799, "r_x3": 221.95200000000003, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84499999999997, "r_y0": 159.16479000000004, "r_x1": 250.71945, "r_y1": 159.16479000000004, "r_x2": 250.71945, "r_y2": 150.31799, "r_x3": 246.84499999999997, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21201, "r_y0": 172.73877000000005, "r_x1": 206.29161, "r_y1": 172.73877000000005, "r_x2": 206.29161, "r_y2": 163.89197000000001, "r_x3": 182.21201, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.289, "r_y0": 172.73877000000005, "r_x1": 209.05661, "r_y1": 172.73877000000005, "r_x2": 209.05661, "r_y2": 163.33411, "r_x3": 206.289, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.056, "r_y0": 172.73877000000005, "r_x1": 219.19968, "r_y1": 172.73877000000005, "r_x2": 219.19968, "r_y2": 163.89197000000001, "r_x3": 209.056, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.69700999999998, "r_y0": 172.73877000000005, "r_x1": 222.46461000000002, "r_y1": 172.73877000000005, "r_x2": 222.46461000000002, "r_y2": 163.33411, "r_x3": 219.69700999999998, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.125, "r_y0": 172.73877000000005, "r_x1": 226.89261, "r_y1": 172.73877000000005, "r_x2": 226.89261, "r_y2": 163.89197000000001, "r_x3": 224.125, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55299000000002, "r_y0": 172.73877000000005, "r_x1": 231.3206, "r_y1": 172.73877000000005, "r_x2": 231.3206, "r_y2": 163.33411, "r_x3": 228.55299000000002, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.31999, "r_y0": 172.73877000000005, "r_x1": 240.64563, "r_y1": 172.73877000000005, "r_x2": 240.64563, "r_y2": 163.89197000000001, "r_x3": 231.31999, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.144, "r_y0": 172.73877000000005, "r_x1": 243.91161, "r_y1": 172.73877000000005, "r_x2": 243.91161, "r_y2": 163.33411, "r_x3": 241.144, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.911, "r_y0": 172.73877000000005, "r_x1": 247.78545, "r_y1": 172.73877000000005, "r_x2": 247.78545, "r_y2": 163.89197000000001, "r_x3": 243.911, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 166.12396, "r_x1": 286.3624, "r_y1": 166.12396, "r_x2": 286.3624, "r_y2": 157.21740999999997, "r_x3": 274.746, "r_y3": 157.21740999999997, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 50.111984, "t": 181.00298999999995, "r": 286.36285, "b": 213.97900000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9735319018363953, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 190.06897000000004, "r_x1": 86.405632, "r_y1": 190.06897000000004, "r_x2": 86.405632, "r_y2": 181.16241000000002, "r_x3": 62.067001, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.581001, "r_y0": 189.84978999999998, "r_x1": 98.724663, "r_y1": 189.84978999999998, "r_x2": 98.724663, "r_y2": 181.00298999999995, "r_x3": 88.581001, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.399, "r_y0": 190.06897000000004, "r_x1": 115.785, "r_y1": 190.06897000000004, "r_x2": 115.785, "r_y2": 181.16241000000002, "r_x3": 101.399, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.961, "r_y0": 189.84978999999998, "r_x1": 127.28664, "r_y1": 189.84978999999998, "r_x2": 127.28664, "r_y2": 181.00298999999995, "r_x3": 117.961, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.95999, "r_y0": 190.06897000000004, "r_x1": 286.36285, "r_y1": 190.06897000000004, "r_x2": 286.36285, "r_y2": 181.16241000000002, "r_x3": 129.95999, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 202.02399000000003, "r_x1": 252.78116000000003, "r_y1": 202.02399000000003, "r_x2": 252.78116000000003, "r_y2": 193.11743, "r_x3": 50.111992, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18201, "r_y0": 201.80480999999997, "r_x1": 257.94962, "r_y1": 201.80480999999997, "r_x2": 257.94962, "r_y2": 192.40015000000005, "r_x3": 255.18201, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.94901, "r_y0": 201.80480999999997, "r_x1": 263.77115, "r_y1": 201.80480999999997, "r_x2": 263.77115, "r_y2": 192.95800999999994, "r_x3": 257.94901, "r_y3": 192.95800999999994, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.155, "r_y0": 201.80480999999997, "r_x1": 267.92261, "r_y1": 201.80480999999997, "r_x2": 267.92261, "r_y2": 192.40015000000005, "r_x3": 265.155, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32199, "r_y0": 202.02399000000003, "r_x1": 286.36179, "r_y1": 202.02399000000003, "r_x2": 286.36179, "r_y2": 193.11743, "r_x3": 270.32199, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 213.97900000000004, "r_x1": 172.13388, "r_y1": 213.97900000000004, "r_x2": 172.13388, "r_y2": 205.07245, "r_x3": 50.111984, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62399, "r_y0": 213.75982999999997, "r_x1": 180.44614, "r_y1": 213.75982999999997, "r_x2": 180.44614, "r_y2": 204.91301999999996, "r_x3": 174.62399, "r_y3": 204.91301999999996, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.82899, "r_y0": 213.97900000000004, "r_x1": 184.31964, "r_y1": 213.97900000000004, "r_x2": 184.31964, "r_y2": 205.07245, "r_x3": 181.82899, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "section_header", "bbox": { "l": 50.112, "t": 224.81946000000005, "r": 170.45169, "b": 234.67151, "coord_origin": "TOPLEFT" }, "confidence": 0.9588837027549744, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 234.67151, "r_x1": 64.551605, "r_y1": 234.67151, "r_x2": 64.551605, "r_y2": 224.81946000000005, "r_x3": 50.112, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.178009, "r_y0": 234.67151, "r_x1": 170.45169, "r_y1": 234.67151, "r_x2": 170.45169, "r_y2": 224.81946000000005, "r_x3": 74.178009, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.112, "t": 243.6499, "r": 286.36514, "b": 396.13794, "coord_origin": "TOPLEFT" }, "confidence": 0.9855090975761414, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.60626000000002, "r_x1": 105.32461, "r_y1": 252.60626000000002, "r_x2": 105.32461, "r_y2": 243.6499, "r_x3": 62.067001, "r_y3": 243.6499, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.12600000000002, "r_y0": 252.67602999999997, "r_x1": 184.68361, "r_y1": 252.67602999999997, "r_x2": 184.68361, "r_y2": 243.76946999999996, "r_x3": 112.12600000000002, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.4781, "r_y0": 252.67602999999997, "r_x1": 286.36188, "r_y1": 252.67602999999997, "r_x2": 286.36188, "r_y2": 243.76946999999996, "r_x3": 191.4781, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.63104, "r_x1": 286.36508, "r_y1": 264.63104, "r_x2": 286.36508, "r_y2": 255.72448999999995, "r_x3": 50.112, "r_y3": 255.72448999999995, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.58606, "r_x1": 286.36508, "r_y1": 276.58606, "r_x2": 286.36508, "r_y2": 267.67949999999996, "r_x3": 50.112, "r_y3": 267.67949999999996, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.54105, "r_x1": 286.36508, "r_y1": 288.54105, "r_x2": 286.36508, "r_y2": 279.63446, "r_x3": 50.112, "r_y3": 279.63446, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.49704, "r_x1": 286.36514, "r_y1": 300.49704, "r_x2": 286.36514, "r_y2": 291.59048, "r_x3": 50.112, "r_y3": 291.59048, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.45203000000004, "r_x1": 286.36508, "r_y1": 312.45203000000004, "r_x2": 286.36508, "r_y2": 303.54547, "r_x3": 50.112, "r_y3": 303.54547, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.40700999999996, "r_x1": 286.36505, "r_y1": 324.40700999999996, "r_x2": 286.36505, "r_y2": 315.50046, "r_x3": 50.112, "r_y3": 315.50046, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.362, "r_x1": 286.36508, "r_y1": 336.362, "r_x2": 286.36508, "r_y2": 327.45544, "r_x3": 50.112, "r_y3": 327.45544, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.31699000000003, "r_x1": 286.36508, "r_y1": 348.31699000000003, "r_x2": 286.36508, "r_y2": 339.41043, "r_x3": 50.112, "r_y3": 339.41043, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 360.27197, "r_x1": 286.36505, "r_y1": 360.27197, "r_x2": 286.36505, "r_y2": 351.36542, "r_x3": 50.112, "r_y3": 351.36542, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 372.2279700000001, "r_x1": 286.36508, "r_y1": 372.2279700000001, "r_x2": 286.36508, "r_y2": 363.32141, "r_x3": 50.112, "r_y3": 363.32141, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 384.18295000000006, "r_x1": 286.36511, "r_y1": 384.18295000000006, "r_x2": 286.36511, "r_y2": 375.2764, "r_x3": 50.112, "r_y3": 375.2764, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.13794, "r_x1": 170.01187, "r_y1": 396.13794, "r_x2": 170.01187, "r_y2": 387.23138, "r_x3": 50.112, "r_y3": 387.23138, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT" }, "confidence": 0.9892510175704956, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.843002, "t": 420.69037, "r": 104.85535, "b": 429.59692, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71237, "r": 236.10649, "b": 423.61893, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.338, "t": 426.66736, "r": 159.21584, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17096, "t": 426.66736, "r": 199.40497, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36009, "t": 426.66736, "r": 247.74349999999998, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54044, "t": 426.66736, "r": 277.27264, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.612, "t": 443.62436, "r": 102.08514, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87206, "t": 443.62436, "r": 153.69141, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.56554, "t": 443.62436, "r": 194.00009, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.82938000000001, "t": 443.62436, "r": 238.26393, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18414, "t": 443.62436, "r": 279.61868, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.165001, "t": 455.58035, "r": 101.5323, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.86716, "t": 455.58035, "r": 153.68651, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62411, "t": 455.58035, "r": 186.94167, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.88795000000002, "t": 455.58035, "r": 231.20551, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.69855, "t": 455.58035, "r": 282.11441, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.315002, "t": 468.13336, "r": 117.38329000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.86766, "t": 468.13336, "r": 153.68701, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57111, "t": 468.13336, "r": 194.00566, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83495, "t": 468.13336, "r": 238.26950000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.698, "t": 468.01379, "r": 282.11386, "b": 476.97018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.612, "t": 483.32635, "r": 102.08514, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87206, "t": 483.32635, "r": 153.69141, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.56554, "t": 483.32635, "r": 194.00009, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.33870999999996, "t": 483.32635, "r": 240.75455999999997, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18411, "t": 483.32635, "r": 279.61865, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.165001, "t": 495.28134, "r": 101.5323, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.86716, "t": 495.28134, "r": 153.68651, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62411, "t": 495.28134, "r": 186.94167, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.88795000000002, "t": 495.28134, "r": 231.20551, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.69855, "t": 495.28134, "r": 282.11441, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.789001, "t": 507.23633, "r": 111.90838999999998, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86221, "t": 507.23633, "r": 153.68156, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.62914, "t": 507.23633, "r": 186.94669, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89297, "t": 507.23633, "r": 231.21053000000003, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.6936, "t": 507.23633, "r": 282.10947, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.315002, "t": 519.1913099999999, "r": 117.38329000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.86766, "t": 519.1913099999999, "r": 153.68701, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57111, "t": 519.1913099999999, "r": 194.00566, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83495, "t": 519.1913099999999, "r": 238.26950000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.189, "t": 519.0717500000001, "r": 279.62354, "b": 528.02814, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.612, "t": 536.49837, "r": 102.08514, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91064, "t": 536.49837, "r": 150.64285, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.56554, "t": 536.49837, "r": 194.00009, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89285, "t": 536.49837, "r": 231.21040000000002, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18411, "t": 536.49837, "r": 279.61865, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.315002, "t": 548.45436, "r": 117.38329000000002, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.90625, "t": 548.45436, "r": 150.63846, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57111, "t": 548.45436, "r": 194.00566, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.88845999999998, "t": 548.45436, "r": 231.20601, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.189, "t": 548.3348100000001, "r": 279.62354, "b": 557.2911799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.315002, "t": 568.00237, "r": 117.38329000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.86766, "t": 568.00237, "r": 153.68701, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57111, "t": 568.00237, "r": 194.00566, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83495, "t": 568.00237, "r": 238.26950000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.1897, "t": 568.00237, "r": 279.62424, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 15, "label": "text", "bbox": { "l": 50.112, "t": 592.43336, "r": 286.36511, "b": 613.29492, "coord_origin": "TOPLEFT" }, "confidence": 0.7209173440933228, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 601.33992, "r_x1": 286.36511, "r_y1": 601.33992, "r_x2": 286.36511, "r_y2": 592.43336, "r_x3": 50.112, "r_y3": 592.43336, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 613.29492, "r_x1": 247.46114, "r_y1": 613.29492, "r_x2": 247.46114, "r_y2": 604.38837, "r_x3": 50.112, "r_y3": 604.38837, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 50.112, "t": 616.34337, "r": 261.78732, "b": 625.24992, "coord_origin": "TOPLEFT" }, "confidence": 0.6433312892913818, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 625.24992, "r_x1": 261.78732, "r_y1": 625.24992, "r_x2": 261.78732, "r_y2": 616.34337, "r_x3": 50.112, "r_y3": 616.34337, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.112015, "t": 644.3498099999999, "r": 286.366, "b": 713.151932, "coord_origin": "TOPLEFT" }, "confidence": 0.9854635000228882, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 653.30618, "r_x1": 124.72179, "r_y1": 653.30618, "r_x2": 124.72179, "r_y2": 644.3498099999999, "r_x3": 62.067001, "r_y3": 644.3498099999999, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.20401, "r_y0": 653.37592, "r_x1": 242.9333, "r_y1": 653.37592, "r_x2": 242.9333, "r_y2": 644.46936, "r_x3": 128.20401, "r_y3": 644.46936, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55401999999998, "r_y0": 653.1467700000001, "r_x1": 286.36084, "r_y1": 653.1467700000001, "r_x2": 286.36084, "r_y2": 644.55902, "r_x3": 245.55401999999998, "r_y3": 644.55902, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.10178, "r_x1": 84.971146, "r_y1": 665.10178, "r_x2": 84.971146, "r_y2": 656.51402, "r_x3": 50.112015, "r_y3": 656.51402, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.515015, "r_y0": 665.33092, "r_x1": 286.366, "r_y1": 665.33092, "r_x2": 286.366, "r_y2": 656.42436, "r_x3": 89.515015, "r_y3": 656.42436, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28593, "r_x1": 286.36511, "r_y1": 677.28593, "r_x2": 286.36511, "r_y2": 668.37936, "r_x3": 50.112015, "r_y3": 668.37936, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24193, "r_x1": 286.36505, "r_y1": 689.24193, "r_x2": 286.36505, "r_y2": 680.33536, "r_x3": 50.112015, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.19693, "r_x1": 286.36511, "r_y1": 701.19693, "r_x2": 286.36511, "r_y2": 692.290359, "r_x3": 50.112015, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151932, "r_x1": 286.36508, "r_y1": 713.151932, "r_x2": 286.36508, "r_y2": 704.245361, "r_x3": 50.112015, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 308.862, "t": 75.20836999999995, "r": 545.11517, "b": 227.57709, "coord_origin": "TOPLEFT" }, "confidence": 0.9713197946548462, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 322.14215, "r_y1": 84.11492999999996, "r_x2": 322.14215, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45401, "r_y0": 83.88580000000002, "r_x1": 404.56702, "r_y1": 83.88580000000002, "r_x2": 404.56702, "r_y2": 75.29803000000004, "r_x3": 325.45401, "r_y3": 75.29803000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.104, "r_y0": 84.11492999999996, "r_x1": 545.10968, "r_y1": 84.11492999999996, "r_x2": 545.10968, "r_y2": 75.20836999999995, "r_x3": 408.104, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11511, "r_y1": 96.06994999999995, "r_x2": 545.11511, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 470.22626, "r_y1": 108.02495999999985, "r_x2": 470.22626, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.52884, "r_y0": 108.02495999999985, "r_x1": 545.11511, "r_y1": 108.02495999999985, "r_x2": 545.11511, "r_y2": 99.11841000000004, "r_x3": 477.52884, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 119.97997999999984, "r_x1": 545.11517, "r_y1": 119.97997999999984, "r_x2": 545.11517, "r_y2": 111.07343000000003, "r_x3": 308.862, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 131.93499999999995, "r_x1": 545.11511, "r_y1": 131.93499999999995, "r_x2": 545.11511, "r_y2": 123.02844000000005, "r_x3": 308.862, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 143.89099, "r_x1": 502.01691000000005, "r_y1": 143.89099, "r_x2": 502.01691000000005, "r_y2": 134.98443999999995, "r_x3": 308.862, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47299, "r_y0": 143.66187000000002, "r_x1": 545.11041, "r_y1": 143.66187000000002, "r_x2": 545.11041, "r_y2": 135.07410000000004, "r_x3": 504.47299, "r_y3": 135.07410000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 155.61688000000004, "r_x1": 343.16324, "r_y1": 155.61688000000004, "r_x2": 343.16324, "r_y2": 147.02910999999995, "r_x3": 308.862, "r_y3": 147.02910999999995, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.371, "r_y0": 155.84600999999998, "r_x1": 545.11493, "r_y1": 155.84600999999998, "r_x2": 545.11493, "r_y2": 146.93944999999997, "r_x3": 346.371, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 167.80102999999997, "r_x1": 446.15652, "r_y1": 167.80102999999997, "r_x2": 446.15652, "r_y2": 158.89446999999996, "r_x3": 308.862, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.28998000000007, "r_y0": 167.57190000000003, "r_x1": 525.04181, "r_y1": 167.57190000000003, "r_x2": 525.04181, "r_y2": 158.98413000000005, "r_x3": 448.28998000000007, "r_y3": 158.98413000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.39899, "r_y0": 167.80102999999997, "r_x1": 545.11249, "r_y1": 167.80102999999997, "r_x2": 545.11249, "r_y2": 158.89446999999996, "r_x3": 527.39899, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 179.75603999999998, "r_x1": 545.11511, "r_y1": 179.75603999999998, "r_x2": 545.11511, "r_y2": 170.84948999999995, "r_x3": 308.862, "r_y3": 170.84948999999995, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 191.71105999999997, "r_x1": 432.86642000000006, "r_y1": 191.71105999999997, "r_x2": 432.86642000000006, "r_y2": 182.80449999999996, "r_x3": 308.862, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39001, "r_y0": 191.48193000000003, "r_x1": 510.93021, "r_y1": 191.48193000000003, "r_x2": 510.93021, "r_y2": 182.89417000000003, "r_x3": 436.39001, "r_y3": 182.89417000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.677, "r_y0": 191.71105999999997, "r_x1": 545.11273, "r_y1": 191.71105999999997, "r_x2": 545.11273, "r_y2": 182.80449999999996, "r_x3": 514.677, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 203.66607999999997, "r_x1": 431.17285, "r_y1": 203.66607999999997, "r_x2": 431.17285, "r_y2": 194.75951999999995, "r_x3": 308.862, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6790199999999, "r_y0": 203.43695000000002, "r_x1": 514.18054, "r_y1": 203.43695000000002, "r_x2": 514.18054, "r_y2": 194.84918000000005, "r_x3": 434.6790199999999, "r_y3": 194.84918000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.17603, "r_y0": 203.66607999999997, "r_x1": 545.10992, "r_y1": 203.66607999999997, "r_x2": 545.10992, "r_y2": 194.75951999999995, "r_x3": 514.17603, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 215.39293999999995, "r_x1": 382.35614, "r_y1": 215.39293999999995, "r_x2": 382.35614, "r_y2": 206.80517999999995, "r_x3": 308.86203, "r_y3": 206.80517999999995, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.07501, "r_y0": 215.62207, "r_x1": 545.11426, "r_y1": 215.62207, "r_x2": 545.11426, "r_y2": 206.71551999999997, "r_x3": 385.07501, "r_y3": 206.71551999999997, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 227.57709, "r_x1": 501.6981799999999, "r_y1": 227.57709, "r_x2": 501.6981799999999, "r_y2": 218.67052999999999, "r_x3": 308.862, "r_y3": 218.67052999999999, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT" }, "confidence": 0.9691730737686157, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.323, "t": 253.66436999999996, "r": 365.33536, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04132, "t": 253.66436999999996, "r": 430.91916, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.10214, "t": 253.66436999999996, "r": 474.58523999999994, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54034, "t": 253.66436999999996, "r": 527.2276, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.65601, "t": 270.62134000000003, "r": 377.00076, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.69809, "t": 270.62134000000003, "r": 438.28073, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.63559, "t": 270.62134000000003, "r": 473.07013, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.16592, "t": 270.62134000000003, "r": 515.60046, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.79501, "t": 282.57631999999995, "r": 377.86331, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69388, "t": 282.57631999999995, "r": 438.27652, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63101, "t": 282.45676, "r": 473.06555000000003, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.1713, "t": 282.45676, "r": 515.60583, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.79501, "t": 294.53131, "r": 377.86331, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.81842, "t": 294.53131, "r": 442.15194999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63135, "t": 294.53131, "r": 473.06589, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.22515999999996, "t": 294.53131, "r": 508.54268999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 12, "label": "caption", "bbox": { "l": 308.862, "t": 316.44931, "r": 545.11517, "b": 337.3108500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9519917964935303, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 325.35587, "r_x1": 341.49951, "r_y1": 325.35587, "r_x2": 341.49951, "r_y2": 316.44931, "r_x3": 308.862, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.60284, "r_y0": 325.35587, "r_x1": 545.11517, "r_y1": 325.35587, "r_x2": 545.11517, "r_y2": 316.44931, "r_x3": 348.60284, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.3108500000001, "r_x1": 474.97845, "r_y1": 337.3108500000001, "r_x2": 474.97845, "r_y2": 328.4043, "r_x3": 308.862, "r_y3": 328.4043, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 308.86197, "t": 367.6797199999999, "r": 545.11566, "b": 520.16769, "coord_origin": "TOPLEFT" }, "confidence": 0.9835010766983032, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 376.63611, "r_x1": 378.94876, "r_y1": 376.63611, "r_x2": 378.94876, "r_y2": 367.6797199999999, "r_x3": 320.81699, "r_y3": 367.6797199999999, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.07898, "r_y0": 376.70584, "r_x1": 545.11566, "r_y1": 376.70584, "r_x2": 545.11566, "r_y2": 367.79929, "r_x3": 387.07898, "r_y3": 367.79929, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 388.66083, "r_x1": 487.19257, "r_y1": 388.66083, "r_x2": 487.19257, "r_y2": 379.75426999999996, "r_x3": 308.86197, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.96713, "r_y0": 388.66083, "r_x1": 545.11511, "r_y1": 388.66083, "r_x2": 545.11511, "r_y2": 379.75426999999996, "r_x3": 493.96713, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 400.61581, "r_x1": 545.11505, "r_y1": 400.61581, "r_x2": 545.11505, "r_y2": 391.70926, "r_x3": 308.86197, "r_y3": 391.70926, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 412.57181, "r_x1": 545.11523, "r_y1": 412.57181, "r_x2": 545.11523, "r_y2": 403.66525, "r_x3": 308.86197, "r_y3": 403.66525, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 424.52679, "r_x1": 314.08096, "r_y1": 424.52679, "r_x2": 314.08096, "r_y2": 415.62024, "r_x3": 308.86197, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69046, "r_y0": 424.52679, "r_x1": 545.11517, "r_y1": 424.52679, "r_x2": 545.11517, "r_y2": 415.62024, "r_x3": 316.69046, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 436.48177999999996, "r_x1": 545.11505, "r_y1": 436.48177999999996, "r_x2": 545.11505, "r_y2": 427.57523, "r_x3": 308.86197, "r_y3": 427.57523, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 448.43677, "r_x1": 545.11505, "r_y1": 448.43677, "r_x2": 545.11505, "r_y2": 439.53021, "r_x3": 308.86197, "r_y3": 439.53021, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 460.39175, "r_x1": 350.23666, "r_y1": 460.39175, "r_x2": 350.23666, "r_y2": 451.4852, "r_x3": 308.86197, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.17596, "r_y0": 460.32201999999995, "r_x1": 374.59183, "r_y1": 460.32201999999995, "r_x2": 374.59183, "r_y2": 451.36563, "r_x3": 352.17596, "r_y3": 451.36563, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53296, "r_y0": 460.39175, "r_x1": 545.11011, "r_y1": 460.39175, "r_x2": 545.11011, "r_y2": 451.4852, "r_x3": 376.53296, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 472.34674, "r_x1": 545.11511, "r_y1": 472.34674, "r_x2": 545.11511, "r_y2": 463.44019, "r_x3": 308.86197, "r_y3": 463.44019, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 484.30273, "r_x1": 545.11517, "r_y1": 484.30273, "r_x2": 545.11517, "r_y2": 475.39618, "r_x3": 308.86197, "r_y3": 475.39618, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 496.25772, "r_x1": 545.11511, "r_y1": 496.25772, "r_x2": 545.11511, "r_y2": 487.35117, "r_x3": 308.86197, "r_y3": 487.35117, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 508.21271, "r_x1": 545.11505, "r_y1": 508.21271, "r_x2": 545.11505, "r_y2": 499.30615, "r_x3": 308.86197, "r_y3": 499.30615, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 520.16769, "r_x1": 405.69846, "r_y1": 520.16769, "r_x2": 405.69846, "r_y2": 511.26114, "r_x3": 308.86197, "r_y3": 511.26114, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "table", "bbox": { "l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT" }, "confidence": 0.9775567650794983, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01099, "t": 552.23337, "r": 384.02335, "b": 561.1399200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03400000000005, "t": 546.25537, "r": 473.94049000000007, "b": 555.16193, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.50598, "t": 558.21037, "r": 436.73999, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.6951, "t": 558.21037, "r": 485.07849, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.3848, "t": 558.21037, "r": 512.117, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68201, "t": 575.16736, "r": 384.3519, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.90097, "t": 575.16736, "r": 431.33550999999994, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16479000000004, "t": 575.16736, "r": 475.59933000000007, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.0289, "t": 575.16736, "r": 514.46344, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72299, "t": 587.12236, "r": 391.31064, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.90582, "t": 587.12236, "r": 431.34036, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.16965, "t": 587.12236, "r": 475.60419, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03374999999994, "t": 587.12236, "r": 514.46832, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.13599, "t": 599.07835, "r": 387.89923, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.90161, "t": 599.07835, "r": 431.33615, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.16544, "t": 599.07835, "r": 475.59998, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.02954000000005, "t": 599.07835, "r": 514.46411, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.55899, "t": 611.03336, "r": 395.47534, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.90616, "t": 611.03336, "r": 431.34069999999997, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.16998000000007, "t": 611.03336, "r": 475.60452, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03409, "t": 611.03336, "r": 514.46863, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78101, "t": 622.9883600000001, "r": 381.25415, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.90158, "t": 622.9883600000001, "r": 431.33612, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.16541, "t": 622.9883600000001, "r": 475.59995000000004, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.0295100000001, "t": 622.9883600000001, "r": 514.46405, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.483, "t": 634.94336, "r": 396.5513, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.90616, "t": 634.94336, "r": 431.34069999999997, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.16998000000007, "t": 634.94336, "r": 475.60452, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03400000000005, "t": 634.82381, "r": 514.46857, "b": 643.78018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 11, "label": "caption", "bbox": { "l": 308.862, "t": 656.86136, "r": 545.11517, "b": 689.6779300000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9541404247283936, "cells": [ { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.76792, "r_x1": 341.73862, "r_y1": 665.76792, "r_x2": 341.73862, "r_y2": 656.86136, "r_x3": 308.862, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.55927, "r_y0": 665.76792, "r_x1": 545.11517, "r_y1": 665.76792, "r_x2": 545.11517, "r_y2": 656.86136, "r_x3": 349.55927, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.7229199999999, "r_x1": 545.11505, "r_y1": 677.7229199999999, "r_x2": 545.11505, "r_y2": 668.81636, "r_x3": 308.862, "r_y3": 668.81636, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.6779300000001, "r_x1": 435.03836, "r_y1": 689.6779300000001, "r_x2": 435.03836, "r_y2": 680.77136, "r_x3": 308.862, "r_y3": 680.77136, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133358, "r": 300.10229, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.8787972331047058, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039921, "r_x1": 300.10229, "r_y1": 743.039921, "r_x2": 300.10229, "r_y2": 734.133358, "r_x3": 295.121, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "table", "bbox": { "l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT" }, "confidence": 0.9892510175704956, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.843002, "t": 420.69037, "r": 104.85535, "b": 429.59692, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71237, "r": 236.10649, "b": 423.61893, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.338, "t": 426.66736, "r": 159.21584, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17096, "t": 426.66736, "r": 199.40497, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36009, "t": 426.66736, "r": 247.74349999999998, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54044, "t": 426.66736, "r": 277.27264, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.612, "t": 443.62436, "r": 102.08514, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87206, "t": 443.62436, "r": 153.69141, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.56554, "t": 443.62436, "r": 194.00009, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.82938000000001, "t": 443.62436, "r": 238.26393, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18414, "t": 443.62436, "r": 279.61868, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.165001, "t": 455.58035, "r": 101.5323, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.86716, "t": 455.58035, "r": 153.68651, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62411, "t": 455.58035, "r": 186.94167, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.88795000000002, "t": 455.58035, "r": 231.20551, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.69855, "t": 455.58035, "r": 282.11441, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.315002, "t": 468.13336, "r": 117.38329000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.86766, "t": 468.13336, "r": 153.68701, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57111, "t": 468.13336, "r": 194.00566, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83495, "t": 468.13336, "r": 238.26950000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.698, "t": 468.01379, "r": 282.11386, "b": 476.97018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.612, "t": 483.32635, "r": 102.08514, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87206, "t": 483.32635, "r": 153.69141, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.56554, "t": 483.32635, "r": 194.00009, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.33870999999996, "t": 483.32635, "r": 240.75455999999997, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18411, "t": 483.32635, "r": 279.61865, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.165001, "t": 495.28134, "r": 101.5323, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.86716, "t": 495.28134, "r": 153.68651, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62411, "t": 495.28134, "r": 186.94167, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.88795000000002, "t": 495.28134, "r": 231.20551, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.69855, "t": 495.28134, "r": 282.11441, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.789001, "t": 507.23633, "r": 111.90838999999998, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86221, "t": 507.23633, "r": 153.68156, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.62914, "t": 507.23633, "r": 186.94669, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89297, "t": 507.23633, "r": 231.21053000000003, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.6936, "t": 507.23633, "r": 282.10947, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.315002, "t": 519.1913099999999, "r": 117.38329000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.86766, "t": 519.1913099999999, "r": 153.68701, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57111, "t": 519.1913099999999, "r": 194.00566, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83495, "t": 519.1913099999999, "r": 238.26950000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.189, "t": 519.0717500000001, "r": 279.62354, "b": 528.02814, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.612, "t": 536.49837, "r": 102.08514, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91064, "t": 536.49837, "r": 150.64285, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.56554, "t": 536.49837, "r": 194.00009, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89285, "t": 536.49837, "r": 231.21040000000002, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18411, "t": 536.49837, "r": 279.61865, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.315002, "t": 548.45436, "r": 117.38329000000002, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.90625, "t": 548.45436, "r": 150.63846, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57111, "t": 548.45436, "r": 194.00566, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.88845999999998, "t": 548.45436, "r": 231.20601, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.189, "t": 548.3348100000001, "r": 279.62354, "b": 557.2911799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.315002, "t": 568.00237, "r": 117.38329000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.86766, "t": 568.00237, "r": 153.68701, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57111, "t": 568.00237, "r": 194.00566, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83495, "t": 568.00237, "r": 238.26950000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.1897, "t": 568.00237, "r": 279.62424, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 11, "num_cols": 5, "table_cells": [ { "bbox": { "l": 78.843002, "t": 420.69037, "r": 104.85535, "b": 429.59692, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 211.2, "t": 414.71237, "r": 236.10649, "b": 423.61893, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 129.338, "t": 426.66736, "r": 159.21584, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 171.17096, "t": 426.66736, "r": 199.40497, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 264.54044, "t": 426.66736, "r": 277.27264, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 443.62436, "r": 102.08514, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87206, "t": 443.62436, "r": 153.69141, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 443.62436, "r": 194.00009, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.82938000000001, "t": 443.62436, "r": 238.26393, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18414, "t": 443.62436, "r": 279.61868, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.165001, "t": 455.58035, "r": 101.5323, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86716, "t": 455.58035, "r": 153.68651, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62411, "t": 455.58035, "r": 186.94167, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88795000000002, "t": 455.58035, "r": 231.20551, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69855, "t": 455.58035, "r": 282.11441, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 468.13336, "r": 117.38329000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 468.13336, "r": 153.68701, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 468.13336, "r": 194.00566, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 468.13336, "r": 238.26950000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.698, "t": 468.01379, "r": 282.11386, "b": 476.97018, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 483.32635, "r": 102.08514, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87206, "t": 483.32635, "r": 153.69141, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 483.32635, "r": 194.00009, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 218.33870999999996, "t": 483.32635, "r": 240.75455999999997, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18411, "t": 483.32635, "r": 279.61865, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.165001, "t": 495.28134, "r": 101.5323, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86716, "t": 495.28134, "r": 153.68651, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62411, "t": 495.28134, "r": 186.94167, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88795000000002, "t": 495.28134, "r": 231.20551, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69855, "t": 495.28134, "r": 282.11441, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 71.789001, "t": 507.23633, "r": 111.90838999999998, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86221, "t": 507.23633, "r": 153.68156, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62914, "t": 507.23633, "r": 186.94669, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89297, "t": 507.23633, "r": 231.21053000000003, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.6936, "t": 507.23633, "r": 282.10947, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 519.1913099999999, "r": 117.38329000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 519.1913099999999, "r": 153.68701, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 519.1913099999999, "r": 194.00566, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 519.1913099999999, "r": 238.26950000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.189, "t": 519.0717500000001, "r": 279.62354, "b": 528.02814, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 536.49837, "r": 102.08514, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91064, "t": 536.49837, "r": 150.64285, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 536.49837, "r": 194.00009, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89285, "t": 536.49837, "r": 231.21040000000002, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18411, "t": 536.49837, "r": 279.61865, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 548.45436, "r": 117.38329000000002, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.90625, "t": 548.45436, "r": 150.63846, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 548.45436, "r": 194.00566, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88845999999998, "t": 548.45436, "r": 231.20601, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.189, "t": 548.3348100000001, "r": 279.62354, "b": 557.2911799999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 568.00237, "r": 117.38329000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 568.00237, "r": 153.68701, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 568.00237, "r": 194.00566, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 568.00237, "r": 238.26950000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.1897, "t": 568.00237, "r": 279.62424, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false } ] }, "8": { "label": "table", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "table", "bbox": { "l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT" }, "confidence": 0.9691730737686157, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.323, "t": 253.66436999999996, "r": 365.33536, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04132, "t": 253.66436999999996, "r": 430.91916, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.10214, "t": 253.66436999999996, "r": 474.58523999999994, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54034, "t": 253.66436999999996, "r": 527.2276, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.65601, "t": 270.62134000000003, "r": 377.00076, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.69809, "t": 270.62134000000003, "r": 438.28073, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.63559, "t": 270.62134000000003, "r": 473.07013, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.16592, "t": 270.62134000000003, "r": 515.60046, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.79501, "t": 282.57631999999995, "r": 377.86331, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69388, "t": 282.57631999999995, "r": 438.27652, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63101, "t": 282.45676, "r": 473.06555000000003, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.1713, "t": 282.45676, "r": 515.60583, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.79501, "t": 294.53131, "r": 377.86331, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.81842, "t": 294.53131, "r": 442.15194999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63135, "t": 294.53131, "r": 473.06589, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.22515999999996, "t": 294.53131, "r": 508.54268999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 4, "num_cols": 4, "table_cells": [ { "bbox": { "l": 339.323, "t": 253.66436999999996, "r": 365.33536, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 401.04132, "t": 253.66436999999996, "r": 430.91916, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 454.10214, "t": 253.66436999999996, "r": 474.58523999999994, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 486.54034, "t": 253.66436999999996, "r": 527.2276, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 327.65601, "t": 270.62134000000003, "r": 377.00076, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69809, "t": 270.62134000000003, "r": 438.28073, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63559, "t": 270.62134000000003, "r": 473.07013, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.16592, "t": 270.62134000000003, "r": 515.60046, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.79501, "t": 282.57631999999995, "r": 377.86331, "b": 291.48288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69388, "t": 282.57631999999995, "r": 438.27652, "b": 291.48288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63101, "t": 282.45676, "r": 473.06555000000003, "b": 291.41315, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.1713, "t": 282.45676, "r": 515.60583, "b": 291.41315, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.79501, "t": 294.53131, "r": 377.86331, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 389.81842, "t": 294.53131, "r": 442.15194999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63135, "t": 294.53131, "r": 473.06589, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 505.22515999999996, "t": 294.53131, "r": 508.54268999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false } ] }, "5": { "label": "table", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "table", "bbox": { "l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT" }, "confidence": 0.9775567650794983, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01099, "t": 552.23337, "r": 384.02335, "b": 561.1399200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03400000000005, "t": 546.25537, "r": 473.94049000000007, "b": 555.16193, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.50598, "t": 558.21037, "r": 436.73999, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.6951, "t": 558.21037, "r": 485.07849, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.3848, "t": 558.21037, "r": 512.117, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68201, "t": 575.16736, "r": 384.3519, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.90097, "t": 575.16736, "r": 431.33550999999994, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16479000000004, "t": 575.16736, "r": 475.59933000000007, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.0289, "t": 575.16736, "r": 514.46344, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72299, "t": 587.12236, "r": 391.31064, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.90582, "t": 587.12236, "r": 431.34036, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.16965, "t": 587.12236, "r": 475.60419, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03374999999994, "t": 587.12236, "r": 514.46832, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.13599, "t": 599.07835, "r": 387.89923, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.90161, "t": 599.07835, "r": 431.33615, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.16544, "t": 599.07835, "r": 475.59998, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.02954000000005, "t": 599.07835, "r": 514.46411, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.55899, "t": 611.03336, "r": 395.47534, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.90616, "t": 611.03336, "r": 431.34069999999997, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.16998000000007, "t": 611.03336, "r": 475.60452, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03409, "t": 611.03336, "r": 514.46863, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78101, "t": 622.9883600000001, "r": 381.25415, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.90158, "t": 622.9883600000001, "r": 431.33612, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.16541, "t": 622.9883600000001, "r": 475.59995000000004, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.0295100000001, "t": 622.9883600000001, "r": 514.46405, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.483, "t": 634.94336, "r": 396.5513, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.90616, "t": 634.94336, "r": 431.34069999999997, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.16998000000007, "t": 634.94336, "r": 475.60452, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03400000000005, "t": 634.82381, "r": 514.46857, "b": 643.78018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 4, "table_cells": [ { "bbox": { "l": 358.01099, "t": 552.23337, "r": 384.02335, "b": 561.1399200000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.03400000000005, "t": 546.25537, "r": 473.94049000000007, "b": 555.16193, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 408.50598, "t": 558.21037, "r": 436.73999, "b": 567.11693, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 499.3848, "t": 558.21037, "r": 512.117, "b": 567.11693, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 357.68201, "t": 575.16736, "r": 384.3519, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90097, "t": 575.16736, "r": 431.33550999999994, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16479000000004, "t": 575.16736, "r": 475.59933000000007, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.0289, "t": 575.16736, "r": 514.46344, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 350.72299, "t": 587.12236, "r": 391.31064, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90582, "t": 587.12236, "r": 431.34036, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16965, "t": 587.12236, "r": 475.60419, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03374999999994, "t": 587.12236, "r": 514.46832, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 354.13599, "t": 599.07835, "r": 387.89923, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90161, "t": 599.07835, "r": 431.33615, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16544, "t": 599.07835, "r": 475.59998, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.02954000000005, "t": 599.07835, "r": 514.46411, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 346.55899, "t": 611.03336, "r": 395.47534, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90616, "t": 611.03336, "r": 431.34069999999997, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16998000000007, "t": 611.03336, "r": 475.60452, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03409, "t": 611.03336, "r": 514.46863, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 360.78101, "t": 622.9883600000001, "r": 381.25415, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90158, "t": 622.9883600000001, "r": 431.33612, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16541, "t": 622.9883600000001, "r": 475.59995000000004, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.0295100000001, "t": 622.9883600000001, "r": 514.46405, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 345.483, "t": 634.94336, "r": 396.5513, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90616, "t": 634.94336, "r": 431.34069999999997, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16998000000007, "t": 634.94336, "r": 475.60452, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03400000000005, "t": 634.82381, "r": 514.46857, "b": 643.78018, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 50.112, "t": 74.40137000000016, "r": 167.89825, "b": 84.25342, "coord_origin": "TOPLEFT" }, "confidence": 0.9554274082183838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.25342, "r_x1": 63.704811, "r_y1": 84.25342, "r_x2": 63.704811, "r_y2": 74.40137000000016, "r_x3": 50.112, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.766685, "r_y0": 84.25342, "r_x1": 167.89825, "r_y1": 84.25342, "r_x2": 167.89825, "r_y2": 74.40137000000016, "r_x3": 72.766685, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3. Datasets and Metrics" }, { "label": "text", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 93.35039999999992, "r": 286.36511, "b": 138.12298999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9862998127937317, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 102.25696000000016, "r_x1": 286.36499, "r_y1": 102.25696000000016, "r_x2": 286.36499, "r_y2": 93.35039999999992, "r_x3": 62.067001, "r_y3": 93.35039999999992, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 114.21198000000015, "r_x1": 286.36511, "r_y1": 114.21198000000015, "r_x2": 286.36511, "r_y2": 105.30542000000003, "r_x3": 50.112, "r_y3": 105.30542000000003, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 126.16699000000006, "r_x1": 286.36505, "r_y1": 126.16699000000006, "r_x2": 286.36505, "r_y2": 117.26044000000002, "r_x3": 50.112, "r_y3": 117.26044000000002, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 138.12298999999996, "r_x1": 136.71687, "r_y1": 138.12298999999996, "r_x2": 136.71687, "r_y2": 129.21642999999995, "r_x3": 50.112, "r_y3": 129.21642999999995, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:" }, { "label": "formula", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "formula", "bbox": { "l": 86.218994, "t": 150.31799, "r": 286.3624, "b": 172.73877000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9500409364700317, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.218994, "r_y0": 165.90479000000005, "r_x1": 118.8784, "r_y1": 165.90479000000005, "r_x2": 118.8784, "r_y2": 157.05798000000004, "r_x3": 86.218994, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87499, "r_y0": 165.90479000000005, "r_x1": 143.26962, "r_y1": 165.90479000000005, "r_x2": 143.26962, "r_y2": 157.05798000000004, "r_x3": 118.87499, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.76799, "r_y0": 165.90479000000005, "r_x1": 165.9019, "r_y1": 165.90479000000005, "r_x2": 165.9019, "r_y2": 157.05798000000004, "r_x3": 143.76799, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12099, "r_y0": 165.90479000000005, "r_x1": 175.8699, "r_y1": 165.90479000000005, "r_x2": 175.8699, "r_y2": 156.50012000000004, "r_x3": 168.12099, "r_y3": 156.50012000000004, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.27899, "r_y0": 159.16479000000004, "r_x1": 221.95677, "r_y1": 159.16479000000004, "r_x2": 221.95677, "r_y2": 150.31799, "r_x3": 179.27899, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95200000000003, "r_y0": 159.16479000000004, "r_x1": 246.34663, "r_y1": 159.16479000000004, "r_x2": 246.34663, "r_y2": 150.31799, "r_x3": 221.95200000000003, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84499999999997, "r_y0": 159.16479000000004, "r_x1": 250.71945, "r_y1": 159.16479000000004, "r_x2": 250.71945, "r_y2": 150.31799, "r_x3": 246.84499999999997, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21201, "r_y0": 172.73877000000005, "r_x1": 206.29161, "r_y1": 172.73877000000005, "r_x2": 206.29161, "r_y2": 163.89197000000001, "r_x3": 182.21201, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.289, "r_y0": 172.73877000000005, "r_x1": 209.05661, "r_y1": 172.73877000000005, "r_x2": 209.05661, "r_y2": 163.33411, "r_x3": 206.289, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.056, "r_y0": 172.73877000000005, "r_x1": 219.19968, "r_y1": 172.73877000000005, "r_x2": 219.19968, "r_y2": 163.89197000000001, "r_x3": 209.056, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.69700999999998, "r_y0": 172.73877000000005, "r_x1": 222.46461000000002, "r_y1": 172.73877000000005, "r_x2": 222.46461000000002, "r_y2": 163.33411, "r_x3": 219.69700999999998, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.125, "r_y0": 172.73877000000005, "r_x1": 226.89261, "r_y1": 172.73877000000005, "r_x2": 226.89261, "r_y2": 163.89197000000001, "r_x3": 224.125, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55299000000002, "r_y0": 172.73877000000005, "r_x1": 231.3206, "r_y1": 172.73877000000005, "r_x2": 231.3206, "r_y2": 163.33411, "r_x3": 228.55299000000002, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.31999, "r_y0": 172.73877000000005, "r_x1": 240.64563, "r_y1": 172.73877000000005, "r_x2": 240.64563, "r_y2": 163.89197000000001, "r_x3": 231.31999, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.144, "r_y0": 172.73877000000005, "r_x1": 243.91161, "r_y1": 172.73877000000005, "r_x2": 243.91161, "r_y2": 163.33411, "r_x3": 241.144, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.911, "r_y0": 172.73877000000005, "r_x1": 247.78545, "r_y1": 172.73877000000005, "r_x2": 247.78545, "r_y2": 163.89197000000001, "r_x3": 243.911, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 166.12396, "r_x1": 286.3624, "r_y1": 166.12396, "r_x2": 286.3624, "r_y2": 157.21740999999997, "r_x3": 274.746, "r_y3": 157.21740999999997, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)" }, { "label": "text", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.111984, "t": 181.00298999999995, "r": 286.36285, "b": 213.97900000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9735319018363953, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 190.06897000000004, "r_x1": 86.405632, "r_y1": 190.06897000000004, "r_x2": 86.405632, "r_y2": 181.16241000000002, "r_x3": 62.067001, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.581001, "r_y0": 189.84978999999998, "r_x1": 98.724663, "r_y1": 189.84978999999998, "r_x2": 98.724663, "r_y2": 181.00298999999995, "r_x3": 88.581001, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.399, "r_y0": 190.06897000000004, "r_x1": 115.785, "r_y1": 190.06897000000004, "r_x2": 115.785, "r_y2": 181.16241000000002, "r_x3": 101.399, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.961, "r_y0": 189.84978999999998, "r_x1": 127.28664, "r_y1": 189.84978999999998, "r_x2": 127.28664, "r_y2": 181.00298999999995, "r_x3": 117.961, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.95999, "r_y0": 190.06897000000004, "r_x1": 286.36285, "r_y1": 190.06897000000004, "r_x2": 286.36285, "r_y2": 181.16241000000002, "r_x3": 129.95999, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 202.02399000000003, "r_x1": 252.78116000000003, "r_y1": 202.02399000000003, "r_x2": 252.78116000000003, "r_y2": 193.11743, "r_x3": 50.111992, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18201, "r_y0": 201.80480999999997, "r_x1": 257.94962, "r_y1": 201.80480999999997, "r_x2": 257.94962, "r_y2": 192.40015000000005, "r_x3": 255.18201, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.94901, "r_y0": 201.80480999999997, "r_x1": 263.77115, "r_y1": 201.80480999999997, "r_x2": 263.77115, "r_y2": 192.95800999999994, "r_x3": 257.94901, "r_y3": 192.95800999999994, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.155, "r_y0": 201.80480999999997, "r_x1": 267.92261, "r_y1": 201.80480999999997, "r_x2": 267.92261, "r_y2": 192.40015000000005, "r_x3": 265.155, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32199, "r_y0": 202.02399000000003, "r_x1": 286.36179, "r_y1": 202.02399000000003, "r_x2": 286.36179, "r_y2": 193.11743, "r_x3": 270.32199, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 213.97900000000004, "r_x1": 172.13388, "r_y1": 213.97900000000004, "r_x2": 172.13388, "r_y2": 205.07245, "r_x3": 50.111984, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62399, "r_y0": 213.75982999999997, "r_x1": 180.44614, "r_y1": 213.75982999999997, "r_x2": 180.44614, "r_y2": 204.91301999999996, "r_x3": 174.62399, "r_y3": 204.91301999999996, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.82899, "r_y0": 213.97900000000004, "r_x1": 184.31964, "r_y1": 213.97900000000004, "r_x2": 184.31964, "r_y2": 205.07245, "r_x3": 181.82899, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ." }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 50.112, "t": 224.81946000000005, "r": 170.45169, "b": 234.67151, "coord_origin": "TOPLEFT" }, "confidence": 0.9588837027549744, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 234.67151, "r_x1": 64.551605, "r_y1": 234.67151, "r_x2": 64.551605, "r_y2": 224.81946000000005, "r_x3": 50.112, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.178009, "r_y0": 234.67151, "r_x1": 170.45169, "r_y1": 234.67151, "r_x2": 170.45169, "r_y2": 224.81946000000005, "r_x3": 74.178009, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.4. Quantitative Analysis" }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.112, "t": 243.6499, "r": 286.36514, "b": 396.13794, "coord_origin": "TOPLEFT" }, "confidence": 0.9855090975761414, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.60626000000002, "r_x1": 105.32461, "r_y1": 252.60626000000002, "r_x2": 105.32461, "r_y2": 243.6499, "r_x3": 62.067001, "r_y3": 243.6499, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.12600000000002, "r_y0": 252.67602999999997, "r_x1": 184.68361, "r_y1": 252.67602999999997, "r_x2": 184.68361, "r_y2": 243.76946999999996, "r_x3": 112.12600000000002, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.4781, "r_y0": 252.67602999999997, "r_x1": 286.36188, "r_y1": 252.67602999999997, "r_x2": 286.36188, "r_y2": 243.76946999999996, "r_x3": 191.4781, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.63104, "r_x1": 286.36508, "r_y1": 264.63104, "r_x2": 286.36508, "r_y2": 255.72448999999995, "r_x3": 50.112, "r_y3": 255.72448999999995, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.58606, "r_x1": 286.36508, "r_y1": 276.58606, "r_x2": 286.36508, "r_y2": 267.67949999999996, "r_x3": 50.112, "r_y3": 267.67949999999996, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.54105, "r_x1": 286.36508, "r_y1": 288.54105, "r_x2": 286.36508, "r_y2": 279.63446, "r_x3": 50.112, "r_y3": 279.63446, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.49704, "r_x1": 286.36514, "r_y1": 300.49704, "r_x2": 286.36514, "r_y2": 291.59048, "r_x3": 50.112, "r_y3": 291.59048, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.45203000000004, "r_x1": 286.36508, "r_y1": 312.45203000000004, "r_x2": 286.36508, "r_y2": 303.54547, "r_x3": 50.112, "r_y3": 303.54547, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.40700999999996, "r_x1": 286.36505, "r_y1": 324.40700999999996, "r_x2": 286.36505, "r_y2": 315.50046, "r_x3": 50.112, "r_y3": 315.50046, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.362, "r_x1": 286.36508, "r_y1": 336.362, "r_x2": 286.36508, "r_y2": 327.45544, "r_x3": 50.112, "r_y3": 327.45544, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.31699000000003, "r_x1": 286.36508, "r_y1": 348.31699000000003, "r_x2": 286.36508, "r_y2": 339.41043, "r_x3": 50.112, "r_y3": 339.41043, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 360.27197, "r_x1": 286.36505, "r_y1": 360.27197, "r_x2": 286.36505, "r_y2": 351.36542, "r_x3": 50.112, "r_y3": 351.36542, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 372.2279700000001, "r_x1": 286.36508, "r_y1": 372.2279700000001, "r_x2": 286.36508, "r_y2": 363.32141, "r_x3": 50.112, "r_y3": 363.32141, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 384.18295000000006, "r_x1": 286.36511, "r_y1": 384.18295000000006, "r_x2": 286.36511, "r_y2": 375.2764, "r_x3": 50.112, "r_y3": 375.2764, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.13794, "r_x1": 170.01187, "r_y1": 396.13794, "r_x2": 170.01187, "r_y2": 387.23138, "r_x3": 50.112, "r_y3": 387.23138, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size." }, { "label": "table", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "table", "bbox": { "l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT" }, "confidence": 0.9892510175704956, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.843002, "t": 420.69037, "r": 104.85535, "b": 429.59692, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71237, "r": 236.10649, "b": 423.61893, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.338, "t": 426.66736, "r": 159.21584, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17096, "t": 426.66736, "r": 199.40497, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36009, "t": 426.66736, "r": 247.74349999999998, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54044, "t": 426.66736, "r": 277.27264, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.612, "t": 443.62436, "r": 102.08514, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87206, "t": 443.62436, "r": 153.69141, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.56554, "t": 443.62436, "r": 194.00009, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.82938000000001, "t": 443.62436, "r": 238.26393, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18414, "t": 443.62436, "r": 279.61868, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.165001, "t": 455.58035, "r": 101.5323, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.86716, "t": 455.58035, "r": 153.68651, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62411, "t": 455.58035, "r": 186.94167, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.88795000000002, "t": 455.58035, "r": 231.20551, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.69855, "t": 455.58035, "r": 282.11441, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.315002, "t": 468.13336, "r": 117.38329000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.86766, "t": 468.13336, "r": 153.68701, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57111, "t": 468.13336, "r": 194.00566, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83495, "t": 468.13336, "r": 238.26950000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.698, "t": 468.01379, "r": 282.11386, "b": 476.97018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.612, "t": 483.32635, "r": 102.08514, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87206, "t": 483.32635, "r": 153.69141, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.56554, "t": 483.32635, "r": 194.00009, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.33870999999996, "t": 483.32635, "r": 240.75455999999997, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18411, "t": 483.32635, "r": 279.61865, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.165001, "t": 495.28134, "r": 101.5323, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.86716, "t": 495.28134, "r": 153.68651, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62411, "t": 495.28134, "r": 186.94167, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.88795000000002, "t": 495.28134, "r": 231.20551, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.69855, "t": 495.28134, "r": 282.11441, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.789001, "t": 507.23633, "r": 111.90838999999998, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86221, "t": 507.23633, "r": 153.68156, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.62914, "t": 507.23633, "r": 186.94669, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89297, "t": 507.23633, "r": 231.21053000000003, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.6936, "t": 507.23633, "r": 282.10947, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.315002, "t": 519.1913099999999, "r": 117.38329000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.86766, "t": 519.1913099999999, "r": 153.68701, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57111, "t": 519.1913099999999, "r": 194.00566, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83495, "t": 519.1913099999999, "r": 238.26950000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.189, "t": 519.0717500000001, "r": 279.62354, "b": 528.02814, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.612, "t": 536.49837, "r": 102.08514, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91064, "t": 536.49837, "r": 150.64285, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.56554, "t": 536.49837, "r": 194.00009, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89285, "t": 536.49837, "r": 231.21040000000002, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18411, "t": 536.49837, "r": 279.61865, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.315002, "t": 548.45436, "r": 117.38329000000002, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.90625, "t": 548.45436, "r": 150.63846, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57111, "t": 548.45436, "r": 194.00566, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.88845999999998, "t": 548.45436, "r": 231.20601, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.189, "t": 548.3348100000001, "r": 279.62354, "b": 557.2911799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.315002, "t": 568.00237, "r": 117.38329000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.86766, "t": 568.00237, "r": 153.68701, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57111, "t": 568.00237, "r": 194.00566, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83495, "t": 568.00237, "r": 238.26950000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.1897, "t": 568.00237, "r": 279.62424, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 11, "num_cols": 5, "table_cells": [ { "bbox": { "l": 78.843002, "t": 420.69037, "r": 104.85535, "b": 429.59692, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 211.2, "t": 414.71237, "r": 236.10649, "b": 423.61893, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 129.338, "t": 426.66736, "r": 159.21584, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 171.17096, "t": 426.66736, "r": 199.40497, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 264.54044, "t": 426.66736, "r": 277.27264, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 443.62436, "r": 102.08514, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87206, "t": 443.62436, "r": 153.69141, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 443.62436, "r": 194.00009, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.82938000000001, "t": 443.62436, "r": 238.26393, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18414, "t": 443.62436, "r": 279.61868, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.165001, "t": 455.58035, "r": 101.5323, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86716, "t": 455.58035, "r": 153.68651, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62411, "t": 455.58035, "r": 186.94167, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88795000000002, "t": 455.58035, "r": 231.20551, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69855, "t": 455.58035, "r": 282.11441, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 468.13336, "r": 117.38329000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 468.13336, "r": 153.68701, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 468.13336, "r": 194.00566, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 468.13336, "r": 238.26950000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.698, "t": 468.01379, "r": 282.11386, "b": 476.97018, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 483.32635, "r": 102.08514, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87206, "t": 483.32635, "r": 153.69141, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 483.32635, "r": 194.00009, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 218.33870999999996, "t": 483.32635, "r": 240.75455999999997, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18411, "t": 483.32635, "r": 279.61865, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.165001, "t": 495.28134, "r": 101.5323, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86716, "t": 495.28134, "r": 153.68651, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62411, "t": 495.28134, "r": 186.94167, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88795000000002, "t": 495.28134, "r": 231.20551, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69855, "t": 495.28134, "r": 282.11441, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 71.789001, "t": 507.23633, "r": 111.90838999999998, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86221, "t": 507.23633, "r": 153.68156, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62914, "t": 507.23633, "r": 186.94669, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89297, "t": 507.23633, "r": 231.21053000000003, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.6936, "t": 507.23633, "r": 282.10947, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 519.1913099999999, "r": 117.38329000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 519.1913099999999, "r": 153.68701, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 519.1913099999999, "r": 194.00566, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 519.1913099999999, "r": 238.26950000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.189, "t": 519.0717500000001, "r": 279.62354, "b": 528.02814, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 536.49837, "r": 102.08514, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91064, "t": 536.49837, "r": 150.64285, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 536.49837, "r": 194.00009, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89285, "t": 536.49837, "r": 231.21040000000002, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18411, "t": 536.49837, "r": 279.61865, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 548.45436, "r": 117.38329000000002, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.90625, "t": 548.45436, "r": 150.63846, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 548.45436, "r": 194.00566, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88845999999998, "t": 548.45436, "r": 231.20601, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.189, "t": 548.3348100000001, "r": 279.62354, "b": 557.2911799999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 568.00237, "r": 117.38329000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 568.00237, "r": 153.68701, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 568.00237, "r": 194.00566, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 568.00237, "r": 238.26950000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.1897, "t": 568.00237, "r": 279.62424, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "text", "id": 15, "page_no": 6, "cluster": { "id": 15, "label": "text", "bbox": { "l": 50.112, "t": 592.43336, "r": 286.36511, "b": 613.29492, "coord_origin": "TOPLEFT" }, "confidence": 0.7209173440933228, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 601.33992, "r_x1": 286.36511, "r_y1": 601.33992, "r_x2": 286.36511, "r_y2": 592.43336, "r_x3": 50.112, "r_y3": 592.43336, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 613.29492, "r_x1": 247.46114, "r_y1": 613.29492, "r_x2": 247.46114, "r_y2": 604.38837, "r_x3": 50.112, "r_y3": 604.38837, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)." }, { "label": "text", "id": 16, "page_no": 6, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.112, "t": 616.34337, "r": 261.78732, "b": 625.24992, "coord_origin": "TOPLEFT" }, "confidence": 0.6433312892913818, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 625.24992, "r_x1": 261.78732, "r_y1": 625.24992, "r_x2": 261.78732, "r_y2": 616.34337, "r_x3": 50.112, "r_y3": 616.34337, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "FT: Model was trained on PubTabNet then finetuned." }, { "label": "text", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.112015, "t": 644.3498099999999, "r": 286.366, "b": 713.151932, "coord_origin": "TOPLEFT" }, "confidence": 0.9854635000228882, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 653.30618, "r_x1": 124.72179, "r_y1": 653.30618, "r_x2": 124.72179, "r_y2": 644.3498099999999, "r_x3": 62.067001, "r_y3": 644.3498099999999, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.20401, "r_y0": 653.37592, "r_x1": 242.9333, "r_y1": 653.37592, "r_x2": 242.9333, "r_y2": 644.46936, "r_x3": 128.20401, "r_y3": 644.46936, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55401999999998, "r_y0": 653.1467700000001, "r_x1": 286.36084, "r_y1": 653.1467700000001, "r_x2": 286.36084, "r_y2": 644.55902, "r_x3": 245.55401999999998, "r_y3": 644.55902, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.10178, "r_x1": 84.971146, "r_y1": 665.10178, "r_x2": 84.971146, "r_y2": 656.51402, "r_x3": 50.112015, "r_y3": 656.51402, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.515015, "r_y0": 665.33092, "r_x1": 286.366, "r_y1": 665.33092, "r_x2": 286.366, "r_y2": 656.42436, "r_x3": 89.515015, "r_y3": 656.42436, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28593, "r_x1": 286.36511, "r_y1": 677.28593, "r_x2": 286.36511, "r_y2": 668.37936, "r_x3": 50.112015, "r_y3": 668.37936, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24193, "r_x1": 286.36505, "r_y1": 689.24193, "r_x2": 286.36505, "r_y2": 680.33536, "r_x3": 50.112015, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.19693, "r_x1": 286.36511, "r_y1": 701.19693, "r_x2": 286.36511, "r_y2": 692.290359, "r_x3": 50.112015, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151932, "r_x1": 286.36508, "r_y1": 713.151932, "r_x2": 286.36508, "r_y2": 704.245361, "r_x3": 50.112015, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate" }, { "label": "text", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.862, "t": 75.20836999999995, "r": 545.11517, "b": 227.57709, "coord_origin": "TOPLEFT" }, "confidence": 0.9713197946548462, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 322.14215, "r_y1": 84.11492999999996, "r_x2": 322.14215, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45401, "r_y0": 83.88580000000002, "r_x1": 404.56702, "r_y1": 83.88580000000002, "r_x2": 404.56702, "r_y2": 75.29803000000004, "r_x3": 325.45401, "r_y3": 75.29803000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.104, "r_y0": 84.11492999999996, "r_x1": 545.10968, "r_y1": 84.11492999999996, "r_x2": 545.10968, "r_y2": 75.20836999999995, "r_x3": 408.104, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11511, "r_y1": 96.06994999999995, "r_x2": 545.11511, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 470.22626, "r_y1": 108.02495999999985, "r_x2": 470.22626, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.52884, "r_y0": 108.02495999999985, "r_x1": 545.11511, "r_y1": 108.02495999999985, "r_x2": 545.11511, "r_y2": 99.11841000000004, "r_x3": 477.52884, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 119.97997999999984, "r_x1": 545.11517, "r_y1": 119.97997999999984, "r_x2": 545.11517, "r_y2": 111.07343000000003, "r_x3": 308.862, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 131.93499999999995, "r_x1": 545.11511, "r_y1": 131.93499999999995, "r_x2": 545.11511, "r_y2": 123.02844000000005, "r_x3": 308.862, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 143.89099, "r_x1": 502.01691000000005, "r_y1": 143.89099, "r_x2": 502.01691000000005, "r_y2": 134.98443999999995, "r_x3": 308.862, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47299, "r_y0": 143.66187000000002, "r_x1": 545.11041, "r_y1": 143.66187000000002, "r_x2": 545.11041, "r_y2": 135.07410000000004, "r_x3": 504.47299, "r_y3": 135.07410000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 155.61688000000004, "r_x1": 343.16324, "r_y1": 155.61688000000004, "r_x2": 343.16324, "r_y2": 147.02910999999995, "r_x3": 308.862, "r_y3": 147.02910999999995, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.371, "r_y0": 155.84600999999998, "r_x1": 545.11493, "r_y1": 155.84600999999998, "r_x2": 545.11493, "r_y2": 146.93944999999997, "r_x3": 346.371, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 167.80102999999997, "r_x1": 446.15652, "r_y1": 167.80102999999997, "r_x2": 446.15652, "r_y2": 158.89446999999996, "r_x3": 308.862, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.28998000000007, "r_y0": 167.57190000000003, "r_x1": 525.04181, "r_y1": 167.57190000000003, "r_x2": 525.04181, "r_y2": 158.98413000000005, "r_x3": 448.28998000000007, "r_y3": 158.98413000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.39899, "r_y0": 167.80102999999997, "r_x1": 545.11249, "r_y1": 167.80102999999997, "r_x2": 545.11249, "r_y2": 158.89446999999996, "r_x3": 527.39899, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 179.75603999999998, "r_x1": 545.11511, "r_y1": 179.75603999999998, "r_x2": 545.11511, "r_y2": 170.84948999999995, "r_x3": 308.862, "r_y3": 170.84948999999995, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 191.71105999999997, "r_x1": 432.86642000000006, "r_y1": 191.71105999999997, "r_x2": 432.86642000000006, "r_y2": 182.80449999999996, "r_x3": 308.862, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39001, "r_y0": 191.48193000000003, "r_x1": 510.93021, "r_y1": 191.48193000000003, "r_x2": 510.93021, "r_y2": 182.89417000000003, "r_x3": 436.39001, "r_y3": 182.89417000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.677, "r_y0": 191.71105999999997, "r_x1": 545.11273, "r_y1": 191.71105999999997, "r_x2": 545.11273, "r_y2": 182.80449999999996, "r_x3": 514.677, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 203.66607999999997, "r_x1": 431.17285, "r_y1": 203.66607999999997, "r_x2": 431.17285, "r_y2": 194.75951999999995, "r_x3": 308.862, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6790199999999, "r_y0": 203.43695000000002, "r_x1": 514.18054, "r_y1": 203.43695000000002, "r_x2": 514.18054, "r_y2": 194.84918000000005, "r_x3": 434.6790199999999, "r_y3": 194.84918000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.17603, "r_y0": 203.66607999999997, "r_x1": 545.10992, "r_y1": 203.66607999999997, "r_x2": 545.10992, "r_y2": 194.75951999999995, "r_x3": 514.17603, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 215.39293999999995, "r_x1": 382.35614, "r_y1": 215.39293999999995, "r_x2": 382.35614, "r_y2": 206.80517999999995, "r_x3": 308.86203, "r_y3": 206.80517999999995, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.07501, "r_y0": 215.62207, "r_x1": 545.11426, "r_y1": 215.62207, "r_x2": 545.11426, "r_y2": 206.71551999999997, "r_x3": 385.07501, "r_y3": 206.71551999999997, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 227.57709, "r_x1": 501.6981799999999, "r_y1": 227.57709, "r_x2": 501.6981799999999, "r_y2": 218.67052999999999, "r_x3": 308.862, "r_y3": 218.67052999999999, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes." }, { "label": "table", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "table", "bbox": { "l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT" }, "confidence": 0.9691730737686157, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.323, "t": 253.66436999999996, "r": 365.33536, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04132, "t": 253.66436999999996, "r": 430.91916, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.10214, "t": 253.66436999999996, "r": 474.58523999999994, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54034, "t": 253.66436999999996, "r": 527.2276, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.65601, "t": 270.62134000000003, "r": 377.00076, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.69809, "t": 270.62134000000003, "r": 438.28073, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.63559, "t": 270.62134000000003, "r": 473.07013, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.16592, "t": 270.62134000000003, "r": 515.60046, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.79501, "t": 282.57631999999995, "r": 377.86331, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69388, "t": 282.57631999999995, "r": 438.27652, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63101, "t": 282.45676, "r": 473.06555000000003, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.1713, "t": 282.45676, "r": 515.60583, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.79501, "t": 294.53131, "r": 377.86331, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.81842, "t": 294.53131, "r": 442.15194999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63135, "t": 294.53131, "r": 473.06589, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.22515999999996, "t": 294.53131, "r": 508.54268999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 4, "num_cols": 4, "table_cells": [ { "bbox": { "l": 339.323, "t": 253.66436999999996, "r": 365.33536, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 401.04132, "t": 253.66436999999996, "r": 430.91916, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 454.10214, "t": 253.66436999999996, "r": 474.58523999999994, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 486.54034, "t": 253.66436999999996, "r": 527.2276, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 327.65601, "t": 270.62134000000003, "r": 377.00076, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69809, "t": 270.62134000000003, "r": 438.28073, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63559, "t": 270.62134000000003, "r": 473.07013, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.16592, "t": 270.62134000000003, "r": 515.60046, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.79501, "t": 282.57631999999995, "r": 377.86331, "b": 291.48288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69388, "t": 282.57631999999995, "r": 438.27652, "b": 291.48288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63101, "t": 282.45676, "r": 473.06555000000003, "b": 291.41315, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.1713, "t": 282.45676, "r": 515.60583, "b": 291.41315, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.79501, "t": 294.53131, "r": 377.86331, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 389.81842, "t": 294.53131, "r": 442.15194999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63135, "t": 294.53131, "r": 473.06589, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 505.22515999999996, "t": 294.53131, "r": 508.54268999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "caption", "bbox": { "l": 308.862, "t": 316.44931, "r": 545.11517, "b": 337.3108500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9519917964935303, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 325.35587, "r_x1": 341.49951, "r_y1": 325.35587, "r_x2": 341.49951, "r_y2": 316.44931, "r_x3": 308.862, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.60284, "r_y0": 325.35587, "r_x1": 545.11517, "r_y1": 325.35587, "r_x2": 545.11517, "r_y2": 316.44931, "r_x3": 348.60284, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.3108500000001, "r_x1": 474.97845, "r_y1": 337.3108500000001, "r_x2": 474.97845, "r_y2": 328.4043, "r_x3": 308.862, "r_y3": 328.4043, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing." }, { "label": "text", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86197, "t": 367.6797199999999, "r": 545.11566, "b": 520.16769, "coord_origin": "TOPLEFT" }, "confidence": 0.9835010766983032, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 376.63611, "r_x1": 378.94876, "r_y1": 376.63611, "r_x2": 378.94876, "r_y2": 367.6797199999999, "r_x3": 320.81699, "r_y3": 367.6797199999999, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.07898, "r_y0": 376.70584, "r_x1": 545.11566, "r_y1": 376.70584, "r_x2": 545.11566, "r_y2": 367.79929, "r_x3": 387.07898, "r_y3": 367.79929, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 388.66083, "r_x1": 487.19257, "r_y1": 388.66083, "r_x2": 487.19257, "r_y2": 379.75426999999996, "r_x3": 308.86197, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.96713, "r_y0": 388.66083, "r_x1": 545.11511, "r_y1": 388.66083, "r_x2": 545.11511, "r_y2": 379.75426999999996, "r_x3": 493.96713, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 400.61581, "r_x1": 545.11505, "r_y1": 400.61581, "r_x2": 545.11505, "r_y2": 391.70926, "r_x3": 308.86197, "r_y3": 391.70926, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 412.57181, "r_x1": 545.11523, "r_y1": 412.57181, "r_x2": 545.11523, "r_y2": 403.66525, "r_x3": 308.86197, "r_y3": 403.66525, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 424.52679, "r_x1": 314.08096, "r_y1": 424.52679, "r_x2": 314.08096, "r_y2": 415.62024, "r_x3": 308.86197, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69046, "r_y0": 424.52679, "r_x1": 545.11517, "r_y1": 424.52679, "r_x2": 545.11517, "r_y2": 415.62024, "r_x3": 316.69046, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 436.48177999999996, "r_x1": 545.11505, "r_y1": 436.48177999999996, "r_x2": 545.11505, "r_y2": 427.57523, "r_x3": 308.86197, "r_y3": 427.57523, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 448.43677, "r_x1": 545.11505, "r_y1": 448.43677, "r_x2": 545.11505, "r_y2": 439.53021, "r_x3": 308.86197, "r_y3": 439.53021, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 460.39175, "r_x1": 350.23666, "r_y1": 460.39175, "r_x2": 350.23666, "r_y2": 451.4852, "r_x3": 308.86197, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.17596, "r_y0": 460.32201999999995, "r_x1": 374.59183, "r_y1": 460.32201999999995, "r_x2": 374.59183, "r_y2": 451.36563, "r_x3": 352.17596, "r_y3": 451.36563, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53296, "r_y0": 460.39175, "r_x1": 545.11011, "r_y1": 460.39175, "r_x2": 545.11011, "r_y2": 451.4852, "r_x3": 376.53296, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 472.34674, "r_x1": 545.11511, "r_y1": 472.34674, "r_x2": 545.11511, "r_y2": 463.44019, "r_x3": 308.86197, "r_y3": 463.44019, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 484.30273, "r_x1": 545.11517, "r_y1": 484.30273, "r_x2": 545.11517, "r_y2": 475.39618, "r_x3": 308.86197, "r_y3": 475.39618, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 496.25772, "r_x1": 545.11511, "r_y1": 496.25772, "r_x2": 545.11511, "r_y2": 487.35117, "r_x3": 308.86197, "r_y3": 487.35117, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 508.21271, "r_x1": 545.11505, "r_y1": 508.21271, "r_x2": 545.11505, "r_y2": 499.30615, "r_x3": 308.86197, "r_y3": 499.30615, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 520.16769, "r_x1": 405.69846, "r_y1": 520.16769, "r_x2": 405.69846, "r_y2": 511.26114, "r_x3": 308.86197, "r_y3": 511.26114, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations." }, { "label": "table", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "table", "bbox": { "l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT" }, "confidence": 0.9775567650794983, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01099, "t": 552.23337, "r": 384.02335, "b": 561.1399200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03400000000005, "t": 546.25537, "r": 473.94049000000007, "b": 555.16193, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.50598, "t": 558.21037, "r": 436.73999, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.6951, "t": 558.21037, "r": 485.07849, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.3848, "t": 558.21037, "r": 512.117, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68201, "t": 575.16736, "r": 384.3519, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.90097, "t": 575.16736, "r": 431.33550999999994, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16479000000004, "t": 575.16736, "r": 475.59933000000007, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.0289, "t": 575.16736, "r": 514.46344, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72299, "t": 587.12236, "r": 391.31064, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.90582, "t": 587.12236, "r": 431.34036, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.16965, "t": 587.12236, "r": 475.60419, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03374999999994, "t": 587.12236, "r": 514.46832, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.13599, "t": 599.07835, "r": 387.89923, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.90161, "t": 599.07835, "r": 431.33615, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.16544, "t": 599.07835, "r": 475.59998, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.02954000000005, "t": 599.07835, "r": 514.46411, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.55899, "t": 611.03336, "r": 395.47534, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.90616, "t": 611.03336, "r": 431.34069999999997, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.16998000000007, "t": 611.03336, "r": 475.60452, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03409, "t": 611.03336, "r": 514.46863, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78101, "t": 622.9883600000001, "r": 381.25415, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.90158, "t": 622.9883600000001, "r": 431.33612, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.16541, "t": 622.9883600000001, "r": 475.59995000000004, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.0295100000001, "t": 622.9883600000001, "r": 514.46405, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.483, "t": 634.94336, "r": 396.5513, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.90616, "t": 634.94336, "r": 431.34069999999997, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.16998000000007, "t": 634.94336, "r": 475.60452, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03400000000005, "t": 634.82381, "r": 514.46857, "b": 643.78018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 4, "table_cells": [ { "bbox": { "l": 358.01099, "t": 552.23337, "r": 384.02335, "b": 561.1399200000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.03400000000005, "t": 546.25537, "r": 473.94049000000007, "b": 555.16193, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 408.50598, "t": 558.21037, "r": 436.73999, "b": 567.11693, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 499.3848, "t": 558.21037, "r": 512.117, "b": 567.11693, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 357.68201, "t": 575.16736, "r": 384.3519, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90097, "t": 575.16736, "r": 431.33550999999994, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16479000000004, "t": 575.16736, "r": 475.59933000000007, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.0289, "t": 575.16736, "r": 514.46344, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 350.72299, "t": 587.12236, "r": 391.31064, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90582, "t": 587.12236, "r": 431.34036, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16965, "t": 587.12236, "r": 475.60419, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03374999999994, "t": 587.12236, "r": 514.46832, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 354.13599, "t": 599.07835, "r": 387.89923, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90161, "t": 599.07835, "r": 431.33615, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16544, "t": 599.07835, "r": 475.59998, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.02954000000005, "t": 599.07835, "r": 514.46411, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 346.55899, "t": 611.03336, "r": 395.47534, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90616, "t": 611.03336, "r": 431.34069999999997, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16998000000007, "t": 611.03336, "r": 475.60452, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03409, "t": 611.03336, "r": 514.46863, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 360.78101, "t": 622.9883600000001, "r": 381.25415, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90158, "t": 622.9883600000001, "r": 431.33612, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16541, "t": 622.9883600000001, "r": 475.59995000000004, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.0295100000001, "t": 622.9883600000001, "r": 514.46405, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 345.483, "t": 634.94336, "r": 396.5513, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90616, "t": 634.94336, "r": 431.34069999999997, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16998000000007, "t": 634.94336, "r": 475.60452, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03400000000005, "t": 634.82381, "r": 514.46857, "b": 643.78018, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.862, "t": 656.86136, "r": 545.11517, "b": 689.6779300000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9541404247283936, "cells": [ { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.76792, "r_x1": 341.73862, "r_y1": 665.76792, "r_x2": 341.73862, "r_y2": 656.86136, "r_x3": 308.862, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.55927, "r_y0": 665.76792, "r_x1": 545.11517, "r_y1": 665.76792, "r_x2": 545.11517, "r_y2": 656.86136, "r_x3": 349.55927, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.7229199999999, "r_x1": 545.11505, "r_y1": 677.7229199999999, "r_x2": 545.11505, "r_y2": 668.81636, "r_x3": 308.862, "r_y3": 668.81636, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.6779300000001, "r_x1": 435.03836, "r_y1": 689.6779300000001, "r_x2": 435.03836, "r_y2": 680.77136, "r_x3": 308.862, "r_y3": 680.77136, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables." }, { "label": "page_footer", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133358, "r": 300.10229, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.8787972331047058, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039921, "r_x1": 300.10229, "r_y1": 743.039921, "r_x2": 300.10229, "r_y2": 734.133358, "r_x3": 295.121, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" } ], "body": [ { "label": "section_header", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 50.112, "t": 74.40137000000016, "r": 167.89825, "b": 84.25342, "coord_origin": "TOPLEFT" }, "confidence": 0.9554274082183838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.25342, "r_x1": 63.704811, "r_y1": 84.25342, "r_x2": 63.704811, "r_y2": 74.40137000000016, "r_x3": 50.112, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.766685, "r_y0": 84.25342, "r_x1": 167.89825, "r_y1": 84.25342, "r_x2": 167.89825, "r_y2": 74.40137000000016, "r_x3": 72.766685, "r_y3": 74.40137000000016, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3. Datasets and Metrics" }, { "label": "text", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 93.35039999999992, "r": 286.36511, "b": 138.12298999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9862998127937317, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 102.25696000000016, "r_x1": 286.36499, "r_y1": 102.25696000000016, "r_x2": 286.36499, "r_y2": 93.35039999999992, "r_x3": 62.067001, "r_y3": 93.35039999999992, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 114.21198000000015, "r_x1": 286.36511, "r_y1": 114.21198000000015, "r_x2": 286.36511, "r_y2": 105.30542000000003, "r_x3": 50.112, "r_y3": 105.30542000000003, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 126.16699000000006, "r_x1": 286.36505, "r_y1": 126.16699000000006, "r_x2": 286.36505, "r_y2": 117.26044000000002, "r_x3": 50.112, "r_y3": 117.26044000000002, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 138.12298999999996, "r_x1": 136.71687, "r_y1": 138.12298999999996, "r_x2": 136.71687, "r_y2": 129.21642999999995, "r_x3": 50.112, "r_y3": 129.21642999999995, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:" }, { "label": "formula", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "formula", "bbox": { "l": 86.218994, "t": 150.31799, "r": 286.3624, "b": 172.73877000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9500409364700317, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.218994, "r_y0": 165.90479000000005, "r_x1": 118.8784, "r_y1": 165.90479000000005, "r_x2": 118.8784, "r_y2": 157.05798000000004, "r_x3": 86.218994, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87499, "r_y0": 165.90479000000005, "r_x1": 143.26962, "r_y1": 165.90479000000005, "r_x2": 143.26962, "r_y2": 157.05798000000004, "r_x3": 118.87499, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.76799, "r_y0": 165.90479000000005, "r_x1": 165.9019, "r_y1": 165.90479000000005, "r_x2": 165.9019, "r_y2": 157.05798000000004, "r_x3": 143.76799, "r_y3": 157.05798000000004, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12099, "r_y0": 165.90479000000005, "r_x1": 175.8699, "r_y1": 165.90479000000005, "r_x2": 175.8699, "r_y2": 156.50012000000004, "r_x3": 168.12099, "r_y3": 156.50012000000004, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.27899, "r_y0": 159.16479000000004, "r_x1": 221.95677, "r_y1": 159.16479000000004, "r_x2": 221.95677, "r_y2": 150.31799, "r_x3": 179.27899, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95200000000003, "r_y0": 159.16479000000004, "r_x1": 246.34663, "r_y1": 159.16479000000004, "r_x2": 246.34663, "r_y2": 150.31799, "r_x3": 221.95200000000003, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84499999999997, "r_y0": 159.16479000000004, "r_x1": 250.71945, "r_y1": 159.16479000000004, "r_x2": 250.71945, "r_y2": 150.31799, "r_x3": 246.84499999999997, "r_y3": 150.31799, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21201, "r_y0": 172.73877000000005, "r_x1": 206.29161, "r_y1": 172.73877000000005, "r_x2": 206.29161, "r_y2": 163.89197000000001, "r_x3": 182.21201, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.289, "r_y0": 172.73877000000005, "r_x1": 209.05661, "r_y1": 172.73877000000005, "r_x2": 209.05661, "r_y2": 163.33411, "r_x3": 206.289, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.056, "r_y0": 172.73877000000005, "r_x1": 219.19968, "r_y1": 172.73877000000005, "r_x2": 219.19968, "r_y2": 163.89197000000001, "r_x3": 209.056, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.69700999999998, "r_y0": 172.73877000000005, "r_x1": 222.46461000000002, "r_y1": 172.73877000000005, "r_x2": 222.46461000000002, "r_y2": 163.33411, "r_x3": 219.69700999999998, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.125, "r_y0": 172.73877000000005, "r_x1": 226.89261, "r_y1": 172.73877000000005, "r_x2": 226.89261, "r_y2": 163.89197000000001, "r_x3": 224.125, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55299000000002, "r_y0": 172.73877000000005, "r_x1": 231.3206, "r_y1": 172.73877000000005, "r_x2": 231.3206, "r_y2": 163.33411, "r_x3": 228.55299000000002, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.31999, "r_y0": 172.73877000000005, "r_x1": 240.64563, "r_y1": 172.73877000000005, "r_x2": 240.64563, "r_y2": 163.89197000000001, "r_x3": 231.31999, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.144, "r_y0": 172.73877000000005, "r_x1": 243.91161, "r_y1": 172.73877000000005, "r_x2": 243.91161, "r_y2": 163.33411, "r_x3": 241.144, "r_y3": 163.33411, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.911, "r_y0": 172.73877000000005, "r_x1": 247.78545, "r_y1": 172.73877000000005, "r_x2": 247.78545, "r_y2": 163.89197000000001, "r_x3": 243.911, "r_y3": 163.89197000000001, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 166.12396, "r_x1": 286.3624, "r_y1": 166.12396, "r_x2": 286.3624, "r_y2": 157.21740999999997, "r_x3": 274.746, "r_y3": 157.21740999999997, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)" }, { "label": "text", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.111984, "t": 181.00298999999995, "r": 286.36285, "b": 213.97900000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9735319018363953, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 190.06897000000004, "r_x1": 86.405632, "r_y1": 190.06897000000004, "r_x2": 86.405632, "r_y2": 181.16241000000002, "r_x3": 62.067001, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.581001, "r_y0": 189.84978999999998, "r_x1": 98.724663, "r_y1": 189.84978999999998, "r_x2": 98.724663, "r_y2": 181.00298999999995, "r_x3": 88.581001, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.399, "r_y0": 190.06897000000004, "r_x1": 115.785, "r_y1": 190.06897000000004, "r_x2": 115.785, "r_y2": 181.16241000000002, "r_x3": 101.399, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.961, "r_y0": 189.84978999999998, "r_x1": 127.28664, "r_y1": 189.84978999999998, "r_x2": 127.28664, "r_y2": 181.00298999999995, "r_x3": 117.961, "r_y3": 181.00298999999995, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.95999, "r_y0": 190.06897000000004, "r_x1": 286.36285, "r_y1": 190.06897000000004, "r_x2": 286.36285, "r_y2": 181.16241000000002, "r_x3": 129.95999, "r_y3": 181.16241000000002, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 202.02399000000003, "r_x1": 252.78116000000003, "r_y1": 202.02399000000003, "r_x2": 252.78116000000003, "r_y2": 193.11743, "r_x3": 50.111992, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18201, "r_y0": 201.80480999999997, "r_x1": 257.94962, "r_y1": 201.80480999999997, "r_x2": 257.94962, "r_y2": 192.40015000000005, "r_x3": 255.18201, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.94901, "r_y0": 201.80480999999997, "r_x1": 263.77115, "r_y1": 201.80480999999997, "r_x2": 263.77115, "r_y2": 192.95800999999994, "r_x3": 257.94901, "r_y3": 192.95800999999994, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.155, "r_y0": 201.80480999999997, "r_x1": 267.92261, "r_y1": 201.80480999999997, "r_x2": 267.92261, "r_y2": 192.40015000000005, "r_x3": 265.155, "r_y3": 192.40015000000005, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32199, "r_y0": 202.02399000000003, "r_x1": 286.36179, "r_y1": 202.02399000000003, "r_x2": 286.36179, "r_y2": 193.11743, "r_x3": 270.32199, "r_y3": 193.11743, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 213.97900000000004, "r_x1": 172.13388, "r_y1": 213.97900000000004, "r_x2": 172.13388, "r_y2": 205.07245, "r_x3": 50.111984, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62399, "r_y0": 213.75982999999997, "r_x1": 180.44614, "r_y1": 213.75982999999997, "r_x2": 180.44614, "r_y2": 204.91301999999996, "r_x3": 174.62399, "r_y3": 204.91301999999996, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.82899, "r_y0": 213.97900000000004, "r_x1": 184.31964, "r_y1": 213.97900000000004, "r_x2": 184.31964, "r_y2": 205.07245, "r_x3": 181.82899, "r_y3": 205.07245, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ." }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 50.112, "t": 224.81946000000005, "r": 170.45169, "b": 234.67151, "coord_origin": "TOPLEFT" }, "confidence": 0.9588837027549744, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 234.67151, "r_x1": 64.551605, "r_y1": 234.67151, "r_x2": 64.551605, "r_y2": 224.81946000000005, "r_x3": 50.112, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.178009, "r_y0": 234.67151, "r_x1": 170.45169, "r_y1": 234.67151, "r_x2": 170.45169, "r_y2": 224.81946000000005, "r_x3": 74.178009, "r_y3": 224.81946000000005, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.4. Quantitative Analysis" }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.112, "t": 243.6499, "r": 286.36514, "b": 396.13794, "coord_origin": "TOPLEFT" }, "confidence": 0.9855090975761414, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 252.60626000000002, "r_x1": 105.32461, "r_y1": 252.60626000000002, "r_x2": 105.32461, "r_y2": 243.6499, "r_x3": 62.067001, "r_y3": 243.6499, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.12600000000002, "r_y0": 252.67602999999997, "r_x1": 184.68361, "r_y1": 252.67602999999997, "r_x2": 184.68361, "r_y2": 243.76946999999996, "r_x3": 112.12600000000002, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.4781, "r_y0": 252.67602999999997, "r_x1": 286.36188, "r_y1": 252.67602999999997, "r_x2": 286.36188, "r_y2": 243.76946999999996, "r_x3": 191.4781, "r_y3": 243.76946999999996, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 264.63104, "r_x1": 286.36508, "r_y1": 264.63104, "r_x2": 286.36508, "r_y2": 255.72448999999995, "r_x3": 50.112, "r_y3": 255.72448999999995, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 276.58606, "r_x1": 286.36508, "r_y1": 276.58606, "r_x2": 286.36508, "r_y2": 267.67949999999996, "r_x3": 50.112, "r_y3": 267.67949999999996, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 288.54105, "r_x1": 286.36508, "r_y1": 288.54105, "r_x2": 286.36508, "r_y2": 279.63446, "r_x3": 50.112, "r_y3": 279.63446, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.49704, "r_x1": 286.36514, "r_y1": 300.49704, "r_x2": 286.36514, "r_y2": 291.59048, "r_x3": 50.112, "r_y3": 291.59048, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.45203000000004, "r_x1": 286.36508, "r_y1": 312.45203000000004, "r_x2": 286.36508, "r_y2": 303.54547, "r_x3": 50.112, "r_y3": 303.54547, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 324.40700999999996, "r_x1": 286.36505, "r_y1": 324.40700999999996, "r_x2": 286.36505, "r_y2": 315.50046, "r_x3": 50.112, "r_y3": 315.50046, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 336.362, "r_x1": 286.36508, "r_y1": 336.362, "r_x2": 286.36508, "r_y2": 327.45544, "r_x3": 50.112, "r_y3": 327.45544, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 348.31699000000003, "r_x1": 286.36508, "r_y1": 348.31699000000003, "r_x2": 286.36508, "r_y2": 339.41043, "r_x3": 50.112, "r_y3": 339.41043, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 360.27197, "r_x1": 286.36505, "r_y1": 360.27197, "r_x2": 286.36505, "r_y2": 351.36542, "r_x3": 50.112, "r_y3": 351.36542, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 372.2279700000001, "r_x1": 286.36508, "r_y1": 372.2279700000001, "r_x2": 286.36508, "r_y2": 363.32141, "r_x3": 50.112, "r_y3": 363.32141, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 384.18295000000006, "r_x1": 286.36511, "r_y1": 384.18295000000006, "r_x2": 286.36511, "r_y2": 375.2764, "r_x3": 50.112, "r_y3": 375.2764, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 396.13794, "r_x1": 170.01187, "r_y1": 396.13794, "r_x2": 170.01187, "r_y2": 387.23138, "r_x3": 50.112, "r_y3": 387.23138, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size." }, { "label": "table", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "table", "bbox": { "l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT" }, "confidence": 0.9892510175704956, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.843002, "t": 420.69037, "r": 104.85535, "b": 429.59692, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.843002, "r_y0": 429.59692, "r_x1": 104.85535, "r_y1": 429.59692, "r_x2": 104.85535, "r_y2": 420.69037, "r_x3": 78.843002, "r_y3": 420.69037, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71237, "r": 236.10649, "b": 423.61893, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.61893, "r_x1": 236.10649, "r_y1": 423.61893, "r_x2": 236.10649, "r_y2": 414.71237, "r_x3": 211.2, "r_y3": 414.71237, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.338, "t": 426.66736, "r": 159.21584, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.338, "r_y0": 435.57391000000007, "r_x1": 159.21584, "r_y1": 435.57391000000007, "r_x2": 159.21584, "r_y2": 426.66736, "r_x3": 129.338, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17096, "t": 426.66736, "r": 199.40497, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17096, "r_y0": 435.57391000000007, "r_x1": 199.40497, "r_y1": 435.57391000000007, "r_x2": 199.40497, "r_y2": 426.66736, "r_x3": 171.17096, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36009, "t": 426.66736, "r": 247.74349999999998, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36009, "r_y0": 435.57391000000007, "r_x1": 247.74349999999998, "r_y1": 435.57391000000007, "r_x2": 247.74349999999998, "r_y2": 426.66736, "r_x3": 211.36009, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54044, "t": 426.66736, "r": 277.27264, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54044, "r_y0": 435.57391000000007, "r_x1": 277.27264, "r_y1": 435.57391000000007, "r_x2": 277.27264, "r_y2": 426.66736, "r_x3": 264.54044, "r_y3": 426.66736, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.612, "t": 443.62436, "r": 102.08514, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 452.53091, "r_x1": 102.08514, "r_y1": 452.53091, "r_x2": 102.08514, "r_y2": 443.62436, "r_x3": 81.612, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87206, "t": 443.62436, "r": 153.69141, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 452.53091, "r_x1": 153.69141, "r_y1": 452.53091, "r_x2": 153.69141, "r_y2": 443.62436, "r_x3": 134.87206, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.56554, "t": 443.62436, "r": 194.00009, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 452.53091, "r_x1": 194.00009, "r_y1": 452.53091, "r_x2": 194.00009, "r_y2": 443.62436, "r_x3": 176.56554, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.82938000000001, "t": 443.62436, "r": 238.26393, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.82938000000001, "r_y0": 452.53091, "r_x1": 238.26393, "r_y1": 452.53091, "r_x2": 238.26393, "r_y2": 443.62436, "r_x3": 220.82938000000001, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18414, "t": 443.62436, "r": 279.61868, "b": 452.53091, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18414, "r_y0": 452.53091, "r_x1": 279.61868, "r_y1": 452.53091, "r_x2": 279.61868, "r_y2": 443.62436, "r_x3": 262.18414, "r_y3": 443.62436, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.165001, "t": 455.58035, "r": 101.5323, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 464.48691, "r_x1": 101.5323, "r_y1": 464.48691, "r_x2": 101.5323, "r_y2": 455.58035, "r_x3": 82.165001, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.86716, "t": 455.58035, "r": 153.68651, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 464.48691, "r_x1": 153.68651, "r_y1": 464.48691, "r_x2": 153.68651, "r_y2": 455.58035, "r_x3": 134.86716, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62411, "t": 455.58035, "r": 186.94167, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 464.48691, "r_x1": 186.94167, "r_y1": 464.48691, "r_x2": 186.94167, "r_y2": 455.58035, "r_x3": 183.62411, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.88795000000002, "t": 455.58035, "r": 231.20551, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 464.48691, "r_x1": 231.20551, "r_y1": 464.48691, "r_x2": 231.20551, "r_y2": 455.58035, "r_x3": 227.88795000000002, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.69855, "t": 455.58035, "r": 282.11441, "b": 464.48691, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 464.48691, "r_x1": 282.11441, "r_y1": 464.48691, "r_x2": 282.11441, "r_y2": 455.58035, "r_x3": 259.69855, "r_y3": 455.58035, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.315002, "t": 468.13336, "r": 117.38329000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 477.03992, "r_x1": 117.38329000000002, "r_y1": 477.03992, "r_x2": 117.38329000000002, "r_y2": 468.13336, "r_x3": 66.315002, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.86766, "t": 468.13336, "r": 153.68701, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 477.03992, "r_x1": 153.68701, "r_y1": 477.03992, "r_x2": 153.68701, "r_y2": 468.13336, "r_x3": 134.86766, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57111, "t": 468.13336, "r": 194.00566, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 477.03992, "r_x1": 194.00566, "r_y1": 477.03992, "r_x2": 194.00566, "r_y2": 468.13336, "r_x3": 176.57111, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83495, "t": 468.13336, "r": 238.26950000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 477.03992, "r_x1": 238.26950000000002, "r_y1": 477.03992, "r_x2": 238.26950000000002, "r_y2": 468.13336, "r_x3": 220.83495, "r_y3": 468.13336, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.698, "t": 468.01379, "r": 282.11386, "b": 476.97018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.698, "r_y0": 476.97018, "r_x1": 282.11386, "r_y1": 476.97018, "r_x2": 282.11386, "r_y2": 468.01379, "r_x3": 259.698, "r_y3": 468.01379, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.612, "t": 483.32635, "r": 102.08514, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 492.23291, "r_x1": 102.08514, "r_y1": 492.23291, "r_x2": 102.08514, "r_y2": 483.32635, "r_x3": 81.612, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87206, "t": 483.32635, "r": 153.69141, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87206, "r_y0": 492.23291, "r_x1": 153.69141, "r_y1": 492.23291, "r_x2": 153.69141, "r_y2": 483.32635, "r_x3": 134.87206, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.56554, "t": 483.32635, "r": 194.00009, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 492.23291, "r_x1": 194.00009, "r_y1": 492.23291, "r_x2": 194.00009, "r_y2": 483.32635, "r_x3": 176.56554, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.33870999999996, "t": 483.32635, "r": 240.75455999999997, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.33870999999996, "r_y0": 492.23291, "r_x1": 240.75455999999997, "r_y1": 492.23291, "r_x2": 240.75455999999997, "r_y2": 483.32635, "r_x3": 218.33870999999996, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18411, "t": 483.32635, "r": 279.61865, "b": 492.23291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 492.23291, "r_x1": 279.61865, "r_y1": 492.23291, "r_x2": 279.61865, "r_y2": 483.32635, "r_x3": 262.18411, "r_y3": 483.32635, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.165001, "t": 495.28134, "r": 101.5323, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.165001, "r_y0": 504.1879, "r_x1": 101.5323, "r_y1": 504.1879, "r_x2": 101.5323, "r_y2": 495.28134, "r_x3": 82.165001, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.86716, "t": 495.28134, "r": 153.68651, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86716, "r_y0": 504.1879, "r_x1": 153.68651, "r_y1": 504.1879, "r_x2": 153.68651, "r_y2": 495.28134, "r_x3": 134.86716, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62411, "t": 495.28134, "r": 186.94167, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62411, "r_y0": 504.1879, "r_x1": 186.94167, "r_y1": 504.1879, "r_x2": 186.94167, "r_y2": 495.28134, "r_x3": 183.62411, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.88795000000002, "t": 495.28134, "r": 231.20551, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88795000000002, "r_y0": 504.1879, "r_x1": 231.20551, "r_y1": 504.1879, "r_x2": 231.20551, "r_y2": 495.28134, "r_x3": 227.88795000000002, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.69855, "t": 495.28134, "r": 282.11441, "b": 504.1879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69855, "r_y0": 504.1879, "r_x1": 282.11441, "r_y1": 504.1879, "r_x2": 282.11441, "r_y2": 495.28134, "r_x3": 259.69855, "r_y3": 495.28134, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.789001, "t": 507.23633, "r": 111.90838999999998, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.789001, "r_y0": 516.14288, "r_x1": 111.90838999999998, "r_y1": 516.14288, "r_x2": 111.90838999999998, "r_y2": 507.23633, "r_x3": 71.789001, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86221, "t": 507.23633, "r": 153.68156, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86221, "r_y0": 516.14288, "r_x1": 153.68156, "r_y1": 516.14288, "r_x2": 153.68156, "r_y2": 507.23633, "r_x3": 134.86221, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.62914, "t": 507.23633, "r": 186.94669, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62914, "r_y0": 516.14288, "r_x1": 186.94669, "r_y1": 516.14288, "r_x2": 186.94669, "r_y2": 507.23633, "r_x3": 183.62914, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89297, "t": 507.23633, "r": 231.21053000000003, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89297, "r_y0": 516.14288, "r_x1": 231.21053000000003, "r_y1": 516.14288, "r_x2": 231.21053000000003, "r_y2": 507.23633, "r_x3": 227.89297, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.6936, "t": 507.23633, "r": 282.10947, "b": 516.14288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.6936, "r_y0": 516.14288, "r_x1": 282.10947, "r_y1": 516.14288, "r_x2": 282.10947, "r_y2": 507.23633, "r_x3": 259.6936, "r_y3": 507.23633, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.315002, "t": 519.1913099999999, "r": 117.38329000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 528.0978700000001, "r_x1": 117.38329000000002, "r_y1": 528.0978700000001, "r_x2": 117.38329000000002, "r_y2": 519.1913099999999, "r_x3": 66.315002, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.86766, "t": 519.1913099999999, "r": 153.68701, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 528.0978700000001, "r_x1": 153.68701, "r_y1": 528.0978700000001, "r_x2": 153.68701, "r_y2": 519.1913099999999, "r_x3": 134.86766, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57111, "t": 519.1913099999999, "r": 194.00566, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 528.0978700000001, "r_x1": 194.00566, "r_y1": 528.0978700000001, "r_x2": 194.00566, "r_y2": 519.1913099999999, "r_x3": 176.57111, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83495, "t": 519.1913099999999, "r": 238.26950000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 528.0978700000001, "r_x1": 238.26950000000002, "r_y1": 528.0978700000001, "r_x2": 238.26950000000002, "r_y2": 519.1913099999999, "r_x3": 220.83495, "r_y3": 519.1913099999999, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.189, "t": 519.0717500000001, "r": 279.62354, "b": 528.02814, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 528.02814, "r_x1": 279.62354, "r_y1": 528.02814, "r_x2": 279.62354, "r_y2": 519.0717500000001, "r_x3": 262.189, "r_y3": 519.0717500000001, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.612, "t": 536.49837, "r": 102.08514, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.612, "r_y0": 545.40492, "r_x1": 102.08514, "r_y1": 545.40492, "r_x2": 102.08514, "r_y2": 536.49837, "r_x3": 81.612, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91064, "t": 536.49837, "r": 150.64285, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91064, "r_y0": 545.40492, "r_x1": 150.64285, "r_y1": 545.40492, "r_x2": 150.64285, "r_y2": 536.49837, "r_x3": 137.91064, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.56554, "t": 536.49837, "r": 194.00009, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56554, "r_y0": 545.40492, "r_x1": 194.00009, "r_y1": 545.40492, "r_x2": 194.00009, "r_y2": 536.49837, "r_x3": 176.56554, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89285, "t": 536.49837, "r": 231.21040000000002, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89285, "r_y0": 545.40492, "r_x1": 231.21040000000002, "r_y1": 545.40492, "r_x2": 231.21040000000002, "r_y2": 536.49837, "r_x3": 227.89285, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18411, "t": 536.49837, "r": 279.61865, "b": 545.40492, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18411, "r_y0": 545.40492, "r_x1": 279.61865, "r_y1": 545.40492, "r_x2": 279.61865, "r_y2": 536.49837, "r_x3": 262.18411, "r_y3": 536.49837, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.315002, "t": 548.45436, "r": 117.38329000000002, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 557.36092, "r_x1": 117.38329000000002, "r_y1": 557.36092, "r_x2": 117.38329000000002, "r_y2": 548.45436, "r_x3": 66.315002, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.90625, "t": 548.45436, "r": 150.63846, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.90625, "r_y0": 557.36092, "r_x1": 150.63846, "r_y1": 557.36092, "r_x2": 150.63846, "r_y2": 548.45436, "r_x3": 137.90625, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57111, "t": 548.45436, "r": 194.00566, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 557.36092, "r_x1": 194.00566, "r_y1": 557.36092, "r_x2": 194.00566, "r_y2": 548.45436, "r_x3": 176.57111, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.88845999999998, "t": 548.45436, "r": 231.20601, "b": 557.36092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.88845999999998, "r_y0": 557.36092, "r_x1": 231.20601, "r_y1": 557.36092, "r_x2": 231.20601, "r_y2": 548.45436, "r_x3": 227.88845999999998, "r_y3": 548.45436, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.189, "t": 548.3348100000001, "r": 279.62354, "b": 557.2911799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.189, "r_y0": 557.2911799999999, "r_x1": 279.62354, "r_y1": 557.2911799999999, "r_x2": 279.62354, "r_y2": 548.3348100000001, "r_x3": 262.189, "r_y3": 548.3348100000001, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.315002, "t": 568.00237, "r": 117.38329000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.315002, "r_y0": 576.90892, "r_x1": 117.38329000000002, "r_y1": 576.90892, "r_x2": 117.38329000000002, "r_y2": 568.00237, "r_x3": 66.315002, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.86766, "t": 568.00237, "r": 153.68701, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86766, "r_y0": 576.90892, "r_x1": 153.68701, "r_y1": 576.90892, "r_x2": 153.68701, "r_y2": 568.00237, "r_x3": 134.86766, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57111, "t": 568.00237, "r": 194.00566, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57111, "r_y0": 576.90892, "r_x1": 194.00566, "r_y1": 576.90892, "r_x2": 194.00566, "r_y2": 568.00237, "r_x3": 176.57111, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83495, "t": 568.00237, "r": 238.26950000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83495, "r_y0": 576.90892, "r_x1": 238.26950000000002, "r_y1": 576.90892, "r_x2": 238.26950000000002, "r_y2": 568.00237, "r_x3": 220.83495, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.1897, "t": 568.00237, "r": 279.62424, "b": 576.90892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.1897, "r_y0": 576.90892, "r_x1": 279.62424, "r_y1": 576.90892, "r_x2": 279.62424, "r_y2": 568.00237, "r_x3": 262.1897, "r_y3": 568.00237, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 11, "num_cols": 5, "table_cells": [ { "bbox": { "l": 78.843002, "t": 420.69037, "r": 104.85535, "b": 429.59692, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 211.2, "t": 414.71237, "r": 236.10649, "b": 423.61893, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 129.338, "t": 426.66736, "r": 159.21584, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 171.17096, "t": 426.66736, "r": 199.40497, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 264.54044, "t": 426.66736, "r": 277.27264, "b": 435.57391000000007, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 443.62436, "r": 102.08514, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87206, "t": 443.62436, "r": 153.69141, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 443.62436, "r": 194.00009, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.82938000000001, "t": 443.62436, "r": 238.26393, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18414, "t": 443.62436, "r": 279.61868, "b": 452.53091, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.165001, "t": 455.58035, "r": 101.5323, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86716, "t": 455.58035, "r": 153.68651, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62411, "t": 455.58035, "r": 186.94167, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88795000000002, "t": 455.58035, "r": 231.20551, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69855, "t": 455.58035, "r": 282.11441, "b": 464.48691, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 468.13336, "r": 117.38329000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 468.13336, "r": 153.68701, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 468.13336, "r": 194.00566, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 468.13336, "r": 238.26950000000002, "b": 477.03992, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.698, "t": 468.01379, "r": 282.11386, "b": 476.97018, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 483.32635, "r": 102.08514, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87206, "t": 483.32635, "r": 153.69141, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 483.32635, "r": 194.00009, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 218.33870999999996, "t": 483.32635, "r": 240.75455999999997, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18411, "t": 483.32635, "r": 279.61865, "b": 492.23291, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.165001, "t": 495.28134, "r": 101.5323, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86716, "t": 495.28134, "r": 153.68651, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62411, "t": 495.28134, "r": 186.94167, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88795000000002, "t": 495.28134, "r": 231.20551, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69855, "t": 495.28134, "r": 282.11441, "b": 504.1879, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 71.789001, "t": 507.23633, "r": 111.90838999999998, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86221, "t": 507.23633, "r": 153.68156, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62914, "t": 507.23633, "r": 186.94669, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89297, "t": 507.23633, "r": 231.21053000000003, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.6936, "t": 507.23633, "r": 282.10947, "b": 516.14288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 519.1913099999999, "r": 117.38329000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 519.1913099999999, "r": 153.68701, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 519.1913099999999, "r": 194.00566, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 519.1913099999999, "r": 238.26950000000002, "b": 528.0978700000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.189, "t": 519.0717500000001, "r": 279.62354, "b": 528.02814, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.612, "t": 536.49837, "r": 102.08514, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91064, "t": 536.49837, "r": 150.64285, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.56554, "t": 536.49837, "r": 194.00009, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89285, "t": 536.49837, "r": 231.21040000000002, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18411, "t": 536.49837, "r": 279.61865, "b": 545.40492, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 548.45436, "r": 117.38329000000002, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.90625, "t": 548.45436, "r": 150.63846, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 548.45436, "r": 194.00566, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.88845999999998, "t": 548.45436, "r": 231.20601, "b": 557.36092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.189, "t": 548.3348100000001, "r": 279.62354, "b": 557.2911799999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.315002, "t": 568.00237, "r": 117.38329000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86766, "t": 568.00237, "r": 153.68701, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57111, "t": 568.00237, "r": 194.00566, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83495, "t": 568.00237, "r": 238.26950000000002, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.1897, "t": 568.00237, "r": 279.62424, "b": 576.90892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "text", "id": 15, "page_no": 6, "cluster": { "id": 15, "label": "text", "bbox": { "l": 50.112, "t": 592.43336, "r": 286.36511, "b": 613.29492, "coord_origin": "TOPLEFT" }, "confidence": 0.7209173440933228, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 601.33992, "r_x1": 286.36511, "r_y1": 601.33992, "r_x2": 286.36511, "r_y2": 592.43336, "r_x3": 50.112, "r_y3": 592.43336, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 613.29492, "r_x1": 247.46114, "r_y1": 613.29492, "r_x2": 247.46114, "r_y2": 604.38837, "r_x3": 50.112, "r_y3": 604.38837, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)." }, { "label": "text", "id": 16, "page_no": 6, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.112, "t": 616.34337, "r": 261.78732, "b": 625.24992, "coord_origin": "TOPLEFT" }, "confidence": 0.6433312892913818, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 625.24992, "r_x1": 261.78732, "r_y1": 625.24992, "r_x2": 261.78732, "r_y2": 616.34337, "r_x3": 50.112, "r_y3": 616.34337, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "FT: Model was trained on PubTabNet then finetuned." }, { "label": "text", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.112015, "t": 644.3498099999999, "r": 286.366, "b": 713.151932, "coord_origin": "TOPLEFT" }, "confidence": 0.9854635000228882, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 653.30618, "r_x1": 124.72179, "r_y1": 653.30618, "r_x2": 124.72179, "r_y2": 644.3498099999999, "r_x3": 62.067001, "r_y3": 644.3498099999999, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.20401, "r_y0": 653.37592, "r_x1": 242.9333, "r_y1": 653.37592, "r_x2": 242.9333, "r_y2": 644.46936, "r_x3": 128.20401, "r_y3": 644.46936, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55401999999998, "r_y0": 653.1467700000001, "r_x1": 286.36084, "r_y1": 653.1467700000001, "r_x2": 286.36084, "r_y2": 644.55902, "r_x3": 245.55401999999998, "r_y3": 644.55902, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 665.10178, "r_x1": 84.971146, "r_y1": 665.10178, "r_x2": 84.971146, "r_y2": 656.51402, "r_x3": 50.112015, "r_y3": 656.51402, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.515015, "r_y0": 665.33092, "r_x1": 286.366, "r_y1": 665.33092, "r_x2": 286.366, "r_y2": 656.42436, "r_x3": 89.515015, "r_y3": 656.42436, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 677.28593, "r_x1": 286.36511, "r_y1": 677.28593, "r_x2": 286.36511, "r_y2": 668.37936, "r_x3": 50.112015, "r_y3": 668.37936, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 689.24193, "r_x1": 286.36505, "r_y1": 689.24193, "r_x2": 286.36505, "r_y2": 680.33536, "r_x3": 50.112015, "r_y3": 680.33536, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.19693, "r_x1": 286.36511, "r_y1": 701.19693, "r_x2": 286.36511, "r_y2": 692.290359, "r_x3": 50.112015, "r_y3": 692.290359, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 713.151932, "r_x1": 286.36508, "r_y1": 713.151932, "r_x2": 286.36508, "r_y2": 704.245361, "r_x3": 50.112015, "r_y3": 704.245361, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate" }, { "label": "text", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.862, "t": 75.20836999999995, "r": 545.11517, "b": 227.57709, "coord_origin": "TOPLEFT" }, "confidence": 0.9713197946548462, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 84.11492999999996, "r_x1": 322.14215, "r_y1": 84.11492999999996, "r_x2": 322.14215, "r_y2": 75.20836999999995, "r_x3": 308.862, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45401, "r_y0": 83.88580000000002, "r_x1": 404.56702, "r_y1": 83.88580000000002, "r_x2": 404.56702, "r_y2": 75.29803000000004, "r_x3": 325.45401, "r_y3": 75.29803000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.104, "r_y0": 84.11492999999996, "r_x1": 545.10968, "r_y1": 84.11492999999996, "r_x2": 545.10968, "r_y2": 75.20836999999995, "r_x3": 408.104, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 96.06994999999995, "r_x1": 545.11511, "r_y1": 96.06994999999995, "r_x2": 545.11511, "r_y2": 87.16339000000005, "r_x3": 308.862, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 108.02495999999985, "r_x1": 470.22626, "r_y1": 108.02495999999985, "r_x2": 470.22626, "r_y2": 99.11841000000004, "r_x3": 308.862, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.52884, "r_y0": 108.02495999999985, "r_x1": 545.11511, "r_y1": 108.02495999999985, "r_x2": 545.11511, "r_y2": 99.11841000000004, "r_x3": 477.52884, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 119.97997999999984, "r_x1": 545.11517, "r_y1": 119.97997999999984, "r_x2": 545.11517, "r_y2": 111.07343000000003, "r_x3": 308.862, "r_y3": 111.07343000000003, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 131.93499999999995, "r_x1": 545.11511, "r_y1": 131.93499999999995, "r_x2": 545.11511, "r_y2": 123.02844000000005, "r_x3": 308.862, "r_y3": 123.02844000000005, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 143.89099, "r_x1": 502.01691000000005, "r_y1": 143.89099, "r_x2": 502.01691000000005, "r_y2": 134.98443999999995, "r_x3": 308.862, "r_y3": 134.98443999999995, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47299, "r_y0": 143.66187000000002, "r_x1": 545.11041, "r_y1": 143.66187000000002, "r_x2": 545.11041, "r_y2": 135.07410000000004, "r_x3": 504.47299, "r_y3": 135.07410000000004, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 155.61688000000004, "r_x1": 343.16324, "r_y1": 155.61688000000004, "r_x2": 343.16324, "r_y2": 147.02910999999995, "r_x3": 308.862, "r_y3": 147.02910999999995, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.371, "r_y0": 155.84600999999998, "r_x1": 545.11493, "r_y1": 155.84600999999998, "r_x2": 545.11493, "r_y2": 146.93944999999997, "r_x3": 346.371, "r_y3": 146.93944999999997, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 167.80102999999997, "r_x1": 446.15652, "r_y1": 167.80102999999997, "r_x2": 446.15652, "r_y2": 158.89446999999996, "r_x3": 308.862, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.28998000000007, "r_y0": 167.57190000000003, "r_x1": 525.04181, "r_y1": 167.57190000000003, "r_x2": 525.04181, "r_y2": 158.98413000000005, "r_x3": 448.28998000000007, "r_y3": 158.98413000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.39899, "r_y0": 167.80102999999997, "r_x1": 545.11249, "r_y1": 167.80102999999997, "r_x2": 545.11249, "r_y2": 158.89446999999996, "r_x3": 527.39899, "r_y3": 158.89446999999996, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 179.75603999999998, "r_x1": 545.11511, "r_y1": 179.75603999999998, "r_x2": 545.11511, "r_y2": 170.84948999999995, "r_x3": 308.862, "r_y3": 170.84948999999995, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 191.71105999999997, "r_x1": 432.86642000000006, "r_y1": 191.71105999999997, "r_x2": 432.86642000000006, "r_y2": 182.80449999999996, "r_x3": 308.862, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39001, "r_y0": 191.48193000000003, "r_x1": 510.93021, "r_y1": 191.48193000000003, "r_x2": 510.93021, "r_y2": 182.89417000000003, "r_x3": 436.39001, "r_y3": 182.89417000000003, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.677, "r_y0": 191.71105999999997, "r_x1": 545.11273, "r_y1": 191.71105999999997, "r_x2": 545.11273, "r_y2": 182.80449999999996, "r_x3": 514.677, "r_y3": 182.80449999999996, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 203.66607999999997, "r_x1": 431.17285, "r_y1": 203.66607999999997, "r_x2": 431.17285, "r_y2": 194.75951999999995, "r_x3": 308.862, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6790199999999, "r_y0": 203.43695000000002, "r_x1": 514.18054, "r_y1": 203.43695000000002, "r_x2": 514.18054, "r_y2": 194.84918000000005, "r_x3": 434.6790199999999, "r_y3": 194.84918000000005, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.17603, "r_y0": 203.66607999999997, "r_x1": 545.10992, "r_y1": 203.66607999999997, "r_x2": 545.10992, "r_y2": 194.75951999999995, "r_x3": 514.17603, "r_y3": 194.75951999999995, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 215.39293999999995, "r_x1": 382.35614, "r_y1": 215.39293999999995, "r_x2": 382.35614, "r_y2": 206.80517999999995, "r_x3": 308.86203, "r_y3": 206.80517999999995, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.07501, "r_y0": 215.62207, "r_x1": 545.11426, "r_y1": 215.62207, "r_x2": 545.11426, "r_y2": 206.71551999999997, "r_x3": 385.07501, "r_y3": 206.71551999999997, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 227.57709, "r_x1": 501.6981799999999, "r_y1": 227.57709, "r_x2": 501.6981799999999, "r_y2": 218.67052999999999, "r_x3": 308.862, "r_y3": 218.67052999999999, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes." }, { "label": "table", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "table", "bbox": { "l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT" }, "confidence": 0.9691730737686157, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.323, "t": 253.66436999999996, "r": 365.33536, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.323, "r_y0": 262.57092, "r_x1": 365.33536, "r_y1": 262.57092, "r_x2": 365.33536, "r_y2": 253.66436999999996, "r_x3": 339.323, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04132, "t": 253.66436999999996, "r": 430.91916, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04132, "r_y0": 262.57092, "r_x1": 430.91916, "r_y1": 262.57092, "r_x2": 430.91916, "r_y2": 253.66436999999996, "r_x3": 401.04132, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.10214, "t": 253.66436999999996, "r": 474.58523999999994, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.10214, "r_y0": 262.57092, "r_x1": 474.58523999999994, "r_y1": 262.57092, "r_x2": 474.58523999999994, "r_y2": 253.66436999999996, "r_x3": 454.10214, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54034, "t": 253.66436999999996, "r": 527.2276, "b": 262.57092, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54034, "r_y0": 262.57092, "r_x1": 527.2276, "r_y1": 262.57092, "r_x2": 527.2276, "r_y2": 253.66436999999996, "r_x3": 486.54034, "r_y3": 253.66436999999996, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.65601, "t": 270.62134000000003, "r": 377.00076, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.65601, "r_y0": 279.52788999999996, "r_x1": 377.00076, "r_y1": 279.52788999999996, "r_x2": 377.00076, "r_y2": 270.62134000000003, "r_x3": 327.65601, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.69809, "t": 270.62134000000003, "r": 438.28073, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69809, "r_y0": 279.52788999999996, "r_x1": 438.28073, "r_y1": 279.52788999999996, "r_x2": 438.28073, "r_y2": 270.62134000000003, "r_x3": 393.69809, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.63559, "t": 270.62134000000003, "r": 473.07013, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63559, "r_y0": 279.52788999999996, "r_x1": 473.07013, "r_y1": 279.52788999999996, "r_x2": 473.07013, "r_y2": 270.62134000000003, "r_x3": 455.63559, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.16592, "t": 270.62134000000003, "r": 515.60046, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.16592, "r_y0": 279.52788999999996, "r_x1": 515.60046, "r_y1": 279.52788999999996, "r_x2": 515.60046, "r_y2": 270.62134000000003, "r_x3": 498.16592, "r_y3": 270.62134000000003, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.79501, "t": 282.57631999999995, "r": 377.86331, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 291.48288, "r_x1": 377.86331, "r_y1": 291.48288, "r_x2": 377.86331, "r_y2": 282.57631999999995, "r_x3": 326.79501, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69388, "t": 282.57631999999995, "r": 438.27652, "b": 291.48288, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69388, "r_y0": 291.48288, "r_x1": 438.27652, "r_y1": 291.48288, "r_x2": 438.27652, "r_y2": 282.57631999999995, "r_x3": 393.69388, "r_y3": 282.57631999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63101, "t": 282.45676, "r": 473.06555000000003, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63101, "r_y0": 291.41315, "r_x1": 473.06555000000003, "r_y1": 291.41315, "r_x2": 473.06555000000003, "r_y2": 282.45676, "r_x3": 455.63101, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.1713, "t": 282.45676, "r": 515.60583, "b": 291.41315, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.1713, "r_y0": 291.41315, "r_x1": 515.60583, "r_y1": 291.41315, "r_x2": 515.60583, "r_y2": 282.45676, "r_x3": 498.1713, "r_y3": 282.45676, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.79501, "t": 294.53131, "r": 377.86331, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 303.43787, "r_x1": 377.86331, "r_y1": 303.43787, "r_x2": 377.86331, "r_y2": 294.53131, "r_x3": 326.79501, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.81842, "t": 294.53131, "r": 442.15194999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.81842, "r_y0": 303.43787, "r_x1": 442.15194999999994, "r_y1": 303.43787, "r_x2": 442.15194999999994, "r_y2": 294.53131, "r_x3": 389.81842, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63135, "t": 294.53131, "r": 473.06589, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63135, "r_y0": 303.43787, "r_x1": 473.06589, "r_y1": 303.43787, "r_x2": 473.06589, "r_y2": 294.53131, "r_x3": 455.63135, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.22515999999996, "t": 294.53131, "r": 508.54268999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.22515999999996, "r_y0": 303.43787, "r_x1": 508.54268999999994, "r_y1": 303.43787, "r_x2": 508.54268999999994, "r_y2": 294.53131, "r_x3": 505.22515999999996, "r_y3": 294.53131, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 4, "num_cols": 4, "table_cells": [ { "bbox": { "l": 339.323, "t": 253.66436999999996, "r": 365.33536, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 401.04132, "t": 253.66436999999996, "r": 430.91916, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 454.10214, "t": 253.66436999999996, "r": 474.58523999999994, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 486.54034, "t": 253.66436999999996, "r": 527.2276, "b": 262.57092, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 327.65601, "t": 270.62134000000003, "r": 377.00076, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69809, "t": 270.62134000000003, "r": 438.28073, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63559, "t": 270.62134000000003, "r": 473.07013, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.16592, "t": 270.62134000000003, "r": 515.60046, "b": 279.52788999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.79501, "t": 282.57631999999995, "r": 377.86331, "b": 291.48288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69388, "t": 282.57631999999995, "r": 438.27652, "b": 291.48288, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63101, "t": 282.45676, "r": 473.06555000000003, "b": 291.41315, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.1713, "t": 282.45676, "r": 515.60583, "b": 291.41315, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.79501, "t": 294.53131, "r": 377.86331, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 389.81842, "t": 294.53131, "r": 442.15194999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63135, "t": 294.53131, "r": 473.06589, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 505.22515999999996, "t": 294.53131, "r": 508.54268999999994, "b": 303.43787, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "caption", "bbox": { "l": 308.862, "t": 316.44931, "r": 545.11517, "b": 337.3108500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9519917964935303, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 325.35587, "r_x1": 341.49951, "r_y1": 325.35587, "r_x2": 341.49951, "r_y2": 316.44931, "r_x3": 308.862, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.60284, "r_y0": 325.35587, "r_x1": 545.11517, "r_y1": 325.35587, "r_x2": 545.11517, "r_y2": 316.44931, "r_x3": 348.60284, "r_y3": 316.44931, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.3108500000001, "r_x1": 474.97845, "r_y1": 337.3108500000001, "r_x2": 474.97845, "r_y2": 328.4043, "r_x3": 308.862, "r_y3": 328.4043, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing." }, { "label": "text", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86197, "t": 367.6797199999999, "r": 545.11566, "b": 520.16769, "coord_origin": "TOPLEFT" }, "confidence": 0.9835010766983032, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 376.63611, "r_x1": 378.94876, "r_y1": 376.63611, "r_x2": 378.94876, "r_y2": 367.6797199999999, "r_x3": 320.81699, "r_y3": 367.6797199999999, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.07898, "r_y0": 376.70584, "r_x1": 545.11566, "r_y1": 376.70584, "r_x2": 545.11566, "r_y2": 367.79929, "r_x3": 387.07898, "r_y3": 367.79929, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 388.66083, "r_x1": 487.19257, "r_y1": 388.66083, "r_x2": 487.19257, "r_y2": 379.75426999999996, "r_x3": 308.86197, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.96713, "r_y0": 388.66083, "r_x1": 545.11511, "r_y1": 388.66083, "r_x2": 545.11511, "r_y2": 379.75426999999996, "r_x3": 493.96713, "r_y3": 379.75426999999996, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 400.61581, "r_x1": 545.11505, "r_y1": 400.61581, "r_x2": 545.11505, "r_y2": 391.70926, "r_x3": 308.86197, "r_y3": 391.70926, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 412.57181, "r_x1": 545.11523, "r_y1": 412.57181, "r_x2": 545.11523, "r_y2": 403.66525, "r_x3": 308.86197, "r_y3": 403.66525, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 424.52679, "r_x1": 314.08096, "r_y1": 424.52679, "r_x2": 314.08096, "r_y2": 415.62024, "r_x3": 308.86197, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69046, "r_y0": 424.52679, "r_x1": 545.11517, "r_y1": 424.52679, "r_x2": 545.11517, "r_y2": 415.62024, "r_x3": 316.69046, "r_y3": 415.62024, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 436.48177999999996, "r_x1": 545.11505, "r_y1": 436.48177999999996, "r_x2": 545.11505, "r_y2": 427.57523, "r_x3": 308.86197, "r_y3": 427.57523, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 448.43677, "r_x1": 545.11505, "r_y1": 448.43677, "r_x2": 545.11505, "r_y2": 439.53021, "r_x3": 308.86197, "r_y3": 439.53021, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 460.39175, "r_x1": 350.23666, "r_y1": 460.39175, "r_x2": 350.23666, "r_y2": 451.4852, "r_x3": 308.86197, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.17596, "r_y0": 460.32201999999995, "r_x1": 374.59183, "r_y1": 460.32201999999995, "r_x2": 374.59183, "r_y2": 451.36563, "r_x3": 352.17596, "r_y3": 451.36563, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53296, "r_y0": 460.39175, "r_x1": 545.11011, "r_y1": 460.39175, "r_x2": 545.11011, "r_y2": 451.4852, "r_x3": 376.53296, "r_y3": 451.4852, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 472.34674, "r_x1": 545.11511, "r_y1": 472.34674, "r_x2": 545.11511, "r_y2": 463.44019, "r_x3": 308.86197, "r_y3": 463.44019, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 484.30273, "r_x1": 545.11517, "r_y1": 484.30273, "r_x2": 545.11517, "r_y2": 475.39618, "r_x3": 308.86197, "r_y3": 475.39618, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 496.25772, "r_x1": 545.11511, "r_y1": 496.25772, "r_x2": 545.11511, "r_y2": 487.35117, "r_x3": 308.86197, "r_y3": 487.35117, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 508.21271, "r_x1": 545.11505, "r_y1": 508.21271, "r_x2": 545.11505, "r_y2": 499.30615, "r_x3": 308.86197, "r_y3": 499.30615, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 520.16769, "r_x1": 405.69846, "r_y1": 520.16769, "r_x2": 405.69846, "r_y2": 511.26114, "r_x3": 308.86197, "r_y3": 511.26114, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations." }, { "label": "table", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "table", "bbox": { "l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT" }, "confidence": 0.9775567650794983, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01099, "t": 552.23337, "r": 384.02335, "b": 561.1399200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01099, "r_y0": 561.1399200000001, "r_x1": 384.02335, "r_y1": 561.1399200000001, "r_x2": 384.02335, "r_y2": 552.23337, "r_x3": 358.01099, "r_y3": 552.23337, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03400000000005, "t": 546.25537, "r": 473.94049000000007, "b": 555.16193, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03400000000005, "r_y0": 555.16193, "r_x1": 473.94049000000007, "r_y1": 555.16193, "r_x2": 473.94049000000007, "r_y2": 546.25537, "r_x3": 449.03400000000005, "r_y3": 546.25537, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.50598, "t": 558.21037, "r": 436.73999, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.50598, "r_y0": 567.11693, "r_x1": 436.73999, "r_y1": 567.11693, "r_x2": 436.73999, "r_y2": 558.21037, "r_x3": 408.50598, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.6951, "t": 558.21037, "r": 485.07849, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.6951, "r_y0": 567.11693, "r_x1": 485.07849, "r_y1": 567.11693, "r_x2": 485.07849, "r_y2": 558.21037, "r_x3": 448.6951, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.3848, "t": 558.21037, "r": 512.117, "b": 567.11693, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.3848, "r_y0": 567.11693, "r_x1": 512.117, "r_y1": 567.11693, "r_x2": 512.117, "r_y2": 558.21037, "r_x3": 499.3848, "r_y3": 558.21037, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68201, "t": 575.16736, "r": 384.3519, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68201, "r_y0": 584.0739100000001, "r_x1": 384.3519, "r_y1": 584.0739100000001, "r_x2": 384.3519, "r_y2": 575.16736, "r_x3": 357.68201, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.90097, "t": 575.16736, "r": 431.33550999999994, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90097, "r_y0": 584.0739100000001, "r_x1": 431.33550999999994, "r_y1": 584.0739100000001, "r_x2": 431.33550999999994, "r_y2": 575.16736, "r_x3": 413.90097, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16479000000004, "t": 575.16736, "r": 475.59933000000007, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16479000000004, "r_y0": 584.0739100000001, "r_x1": 475.59933000000007, "r_y1": 584.0739100000001, "r_x2": 475.59933000000007, "r_y2": 575.16736, "r_x3": 458.16479000000004, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.0289, "t": 575.16736, "r": 514.46344, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0289, "r_y0": 584.0739100000001, "r_x1": 514.46344, "r_y1": 584.0739100000001, "r_x2": 514.46344, "r_y2": 575.16736, "r_x3": 497.0289, "r_y3": 575.16736, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72299, "t": 587.12236, "r": 391.31064, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72299, "r_y0": 596.02892, "r_x1": 391.31064, "r_y1": 596.02892, "r_x2": 391.31064, "r_y2": 587.12236, "r_x3": 350.72299, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.90582, "t": 587.12236, "r": 431.34036, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90582, "r_y0": 596.02892, "r_x1": 431.34036, "r_y1": 596.02892, "r_x2": 431.34036, "r_y2": 587.12236, "r_x3": 413.90582, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.16965, "t": 587.12236, "r": 475.60419, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16965, "r_y0": 596.02892, "r_x1": 475.60419, "r_y1": 596.02892, "r_x2": 475.60419, "r_y2": 587.12236, "r_x3": 458.16965, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03374999999994, "t": 587.12236, "r": 514.46832, "b": 596.02892, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03374999999994, "r_y0": 596.02892, "r_x1": 514.46832, "r_y1": 596.02892, "r_x2": 514.46832, "r_y2": 587.12236, "r_x3": 497.03374999999994, "r_y3": 587.12236, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.13599, "t": 599.07835, "r": 387.89923, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.13599, "r_y0": 607.98491, "r_x1": 387.89923, "r_y1": 607.98491, "r_x2": 387.89923, "r_y2": 599.07835, "r_x3": 354.13599, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.90161, "t": 599.07835, "r": 431.33615, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90161, "r_y0": 607.98491, "r_x1": 431.33615, "r_y1": 607.98491, "r_x2": 431.33615, "r_y2": 599.07835, "r_x3": 413.90161, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.16544, "t": 599.07835, "r": 475.59998, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16544, "r_y0": 607.98491, "r_x1": 475.59998, "r_y1": 607.98491, "r_x2": 475.59998, "r_y2": 599.07835, "r_x3": 458.16544, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.02954000000005, "t": 599.07835, "r": 514.46411, "b": 607.98491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.02954000000005, "r_y0": 607.98491, "r_x1": 514.46411, "r_y1": 607.98491, "r_x2": 514.46411, "r_y2": 599.07835, "r_x3": 497.02954000000005, "r_y3": 599.07835, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.55899, "t": 611.03336, "r": 395.47534, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.55899, "r_y0": 619.93991, "r_x1": 395.47534, "r_y1": 619.93991, "r_x2": 395.47534, "r_y2": 611.03336, "r_x3": 346.55899, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.90616, "t": 611.03336, "r": 431.34069999999997, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 619.93991, "r_x1": 431.34069999999997, "r_y1": 619.93991, "r_x2": 431.34069999999997, "r_y2": 611.03336, "r_x3": 413.90616, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.16998000000007, "t": 611.03336, "r": 475.60452, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 619.93991, "r_x1": 475.60452, "r_y1": 619.93991, "r_x2": 475.60452, "r_y2": 611.03336, "r_x3": 458.16998000000007, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03409, "t": 611.03336, "r": 514.46863, "b": 619.93991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03409, "r_y0": 619.93991, "r_x1": 514.46863, "r_y1": 619.93991, "r_x2": 514.46863, "r_y2": 611.03336, "r_x3": 497.03409, "r_y3": 611.03336, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78101, "t": 622.9883600000001, "r": 381.25415, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78101, "r_y0": 631.89491, "r_x1": 381.25415, "r_y1": 631.89491, "r_x2": 381.25415, "r_y2": 622.9883600000001, "r_x3": 360.78101, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.90158, "t": 622.9883600000001, "r": 431.33612, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90158, "r_y0": 631.89491, "r_x1": 431.33612, "r_y1": 631.89491, "r_x2": 431.33612, "r_y2": 622.9883600000001, "r_x3": 413.90158, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.16541, "t": 622.9883600000001, "r": 475.59995000000004, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16541, "r_y0": 631.89491, "r_x1": 475.59995000000004, "r_y1": 631.89491, "r_x2": 475.59995000000004, "r_y2": 622.9883600000001, "r_x3": 458.16541, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.0295100000001, "t": 622.9883600000001, "r": 514.46405, "b": 631.89491, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.0295100000001, "r_y0": 631.89491, "r_x1": 514.46405, "r_y1": 631.89491, "r_x2": 514.46405, "r_y2": 622.9883600000001, "r_x3": 497.0295100000001, "r_y3": 622.9883600000001, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.483, "t": 634.94336, "r": 396.5513, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.483, "r_y0": 643.84991, "r_x1": 396.5513, "r_y1": 643.84991, "r_x2": 396.5513, "r_y2": 634.94336, "r_x3": 345.483, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.90616, "t": 634.94336, "r": 431.34069999999997, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.90616, "r_y0": 643.84991, "r_x1": 431.34069999999997, "r_y1": 643.84991, "r_x2": 431.34069999999997, "r_y2": 634.94336, "r_x3": 413.90616, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.16998000000007, "t": 634.94336, "r": 475.60452, "b": 643.84991, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16998000000007, "r_y0": 643.84991, "r_x1": 475.60452, "r_y1": 643.84991, "r_x2": 475.60452, "r_y2": 634.94336, "r_x3": 458.16998000000007, "r_y3": 634.94336, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03400000000005, "t": 634.82381, "r": 514.46857, "b": 643.78018, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03400000000005, "r_y0": 643.78018, "r_x1": 514.46857, "r_y1": 643.78018, "r_x2": 514.46857, "r_y2": 634.82381, "r_x3": 497.03400000000005, "r_y3": 634.82381, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 4, "table_cells": [ { "bbox": { "l": 358.01099, "t": 552.23337, "r": 384.02335, "b": 561.1399200000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.03400000000005, "t": 546.25537, "r": 473.94049000000007, "b": 555.16193, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 408.50598, "t": 558.21037, "r": 436.73999, "b": 567.11693, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 499.3848, "t": 558.21037, "r": 512.117, "b": 567.11693, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 357.68201, "t": 575.16736, "r": 384.3519, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90097, "t": 575.16736, "r": 431.33550999999994, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16479000000004, "t": 575.16736, "r": 475.59933000000007, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.0289, "t": 575.16736, "r": 514.46344, "b": 584.0739100000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 350.72299, "t": 587.12236, "r": 391.31064, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90582, "t": 587.12236, "r": 431.34036, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16965, "t": 587.12236, "r": 475.60419, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03374999999994, "t": 587.12236, "r": 514.46832, "b": 596.02892, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 354.13599, "t": 599.07835, "r": 387.89923, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90161, "t": 599.07835, "r": 431.33615, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16544, "t": 599.07835, "r": 475.59998, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.02954000000005, "t": 599.07835, "r": 514.46411, "b": 607.98491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 346.55899, "t": 611.03336, "r": 395.47534, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90616, "t": 611.03336, "r": 431.34069999999997, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16998000000007, "t": 611.03336, "r": 475.60452, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03409, "t": 611.03336, "r": 514.46863, "b": 619.93991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 360.78101, "t": 622.9883600000001, "r": 381.25415, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90158, "t": 622.9883600000001, "r": 431.33612, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16541, "t": 622.9883600000001, "r": 475.59995000000004, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.0295100000001, "t": 622.9883600000001, "r": 514.46405, "b": 631.89491, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 345.483, "t": 634.94336, "r": 396.5513, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.90616, "t": 634.94336, "r": 431.34069999999997, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16998000000007, "t": 634.94336, "r": 475.60452, "b": 643.84991, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03400000000005, "t": 634.82381, "r": 514.46857, "b": 643.78018, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.862, "t": 656.86136, "r": 545.11517, "b": 689.6779300000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9541404247283936, "cells": [ { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 665.76792, "r_x1": 341.73862, "r_y1": 665.76792, "r_x2": 341.73862, "r_y2": 656.86136, "r_x3": 308.862, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.55927, "r_y0": 665.76792, "r_x1": 545.11517, "r_y1": 665.76792, "r_x2": 545.11517, "r_y2": 656.86136, "r_x3": 349.55927, "r_y3": 656.86136, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 677.7229199999999, "r_x1": 545.11505, "r_y1": 677.7229199999999, "r_x2": 545.11505, "r_y2": 668.81636, "r_x3": 308.862, "r_y3": 668.81636, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 689.6779300000001, "r_x1": 435.03836, "r_y1": 689.6779300000001, "r_x2": 435.03836, "r_y2": 680.77136, "r_x3": 308.862, "r_y3": 680.77136, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables." } ], "headers": [ { "label": "page_footer", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133358, "r": 300.10229, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.8787972331047058, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039921, "r_x1": 300.10229, "r_y1": 743.039921, "r_x2": 300.10229, "r_y2": 734.133358, "r_x3": 295.121, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" } ] } }, { "page_no": 7, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 216.10645, "r_x1": 62.219952, "r_y1": 216.10645, "r_x2": 62.219952, "r_y2": 208.23328000000004, "r_x3": 53.811783000000005, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.424026, "r_y0": 216.10645, "r_x1": 385.93451, "r_y1": 216.10645, "r_x2": 385.93451, "r_y2": 208.23328000000004, "r_x3": 66.424026, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 102.15430000000003, "r_x1": 284.34592, "r_y1": 102.15430000000003, "r_x2": 284.34592, "r_y2": 94.28112999999996, "r_x3": 53.811783000000005, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83081, "r_y0": 102.15430000000003, "r_x1": 431.09119, "r_y1": 102.15430000000003, "r_x2": 431.09119, "r_y2": 94.28112999999996, "r_x3": 304.83081, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.286037, "r_y0": 86.56073000000004, "r_x1": 61.550289, "r_y1": 86.56073000000004, "r_x2": 61.550289, "r_y2": 78.68756000000008, "r_x3": 53.286037, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.682419, "r_y0": 86.56073000000004, "r_x1": 499.55563, "r_y1": 86.56073000000004, "r_x2": 499.55563, "r_y2": 78.68756000000008, "r_x3": 65.682419, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.42731, "r_y0": 298.60284, "r_x1": 549.42175, "r_y1": 298.60284, "r_x2": 549.42175, "r_y2": 292.30426, "r_x3": 380.42731, "r_y3": 292.30426, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 329.78391, "r_x1": 86.864021, "r_y1": 329.78391, "r_x2": 86.864021, "r_y2": 320.87735, "r_x3": 50.112, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.917542, "r_y0": 329.78391, "r_x1": 545.11371, "r_y1": 329.78391, "r_x2": 545.11371, "r_y2": 320.87735, "r_x3": 93.917542, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 341.73889, "r_x1": 545.11371, "r_y1": 341.73889, "r_x2": 545.11371, "r_y2": 332.83233999999993, "r_x3": 50.112, "r_y3": 332.83233999999993, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 353.69388, "r_x1": 545.11377, "r_y1": 353.69388, "r_x2": 545.11377, "r_y2": 344.78732, "r_x3": 50.112, "r_y3": 344.78732, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.64987, "r_x1": 139.79532, "r_y1": 365.64987, "r_x2": 139.79532, "r_y2": 356.74332, "r_x3": 50.112, "r_y3": 356.74332, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26282, "r_y0": 386.44281, "r_x1": 342.07819, "r_y1": 386.44281, "r_x2": 342.07819, "r_y2": 381.77722, "r_x3": 220.26282, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.715248, "r_y0": 386.44281, "r_x1": 85.657333, "r_y1": 386.44281, "r_x2": 85.657333, "r_y2": 381.77722, "r_x3": 53.715248, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 406.87158, "r_x1": 443.69870000000003, "r_y1": 406.87158, "r_x2": 443.69870000000003, "r_y2": 400.55295, "r_x3": 437.37939, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 406.87158, "r_x1": 456.6513100000001, "r_y1": 406.87158, "r_x2": 456.6513100000001, "r_y2": 400.55295, "r_x3": 450.33203, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 406.87158, "r_x1": 469.60394, "r_y1": 406.87158, "r_x2": 469.60394, "r_y2": 400.55295, "r_x3": 463.28464, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23724000000004, "r_y0": 406.87158, "r_x1": 482.5565500000001, "r_y1": 406.87158, "r_x2": 482.5565500000001, "r_y2": 400.55295, "r_x3": 476.23724000000004, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18988, "r_y0": 406.87158, "r_x1": 495.50916, "r_y1": 406.87158, "r_x2": 495.50916, "r_y2": 400.55295, "r_x3": 489.18988, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14251999999993, "r_y0": 406.87158, "r_x1": 508.46178999999995, "r_y1": 406.87158, "r_x2": 508.46178999999995, "r_y2": 400.55295, "r_x3": 502.14251999999993, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09509, "r_y0": 406.87158, "r_x1": 521.41443, "r_y1": 406.87158, "r_x2": 521.41443, "r_y2": 400.55295, "r_x3": 515.09509, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 417.35699, "r_x1": 391.60071, "r_y1": 417.35699, "r_x2": 391.60071, "r_y2": 411.03836000000007, "r_x3": 385.2814, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 417.35699, "r_x1": 404.84271, "r_y1": 417.35699, "r_x2": 404.84271, "r_y2": 411.03836000000007, "r_x3": 398.52341, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 417.35699, "r_x1": 417.79535, "r_y1": 417.35699, "r_x2": 417.79535, "r_y2": 411.03836000000007, "r_x3": 411.47604, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 417.35699, "r_x1": 443.69870000000003, "r_y1": 417.35699, "r_x2": 443.69870000000003, "r_y2": 411.03836000000007, "r_x3": 437.37939, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 417.35699, "r_x1": 456.6513100000001, "r_y1": 417.35699, "r_x2": 456.6513100000001, "r_y2": 411.03836000000007, "r_x3": 450.33203, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 417.35699, "r_x1": 469.60394, "r_y1": 417.35699, "r_x2": 469.60394, "r_y2": 411.03836000000007, "r_x3": 463.28464, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 427.38834, "r_x1": 391.60071, "r_y1": 427.38834, "r_x2": 391.60071, "r_y2": 421.0697, "r_x3": 385.2814, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 427.38834, "r_x1": 404.84271, "r_y1": 427.38834, "r_x2": 404.84271, "r_y2": 421.0697, "r_x3": 398.52341, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 427.38834, "r_x1": 417.79532, "r_y1": 427.38834, "r_x2": 417.79532, "r_y2": 421.0697, "r_x3": 411.47604, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 427.38834, "r_x1": 430.74796, "r_y1": 427.38834, "r_x2": 430.74796, "r_y2": 421.0697, "r_x3": 424.42865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 427.38834, "r_x1": 443.70056, "r_y1": 427.38834, "r_x2": 443.70056, "r_y2": 421.0697, "r_x3": 437.38129, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 427.38834, "r_x1": 456.65319999999997, "r_y1": 427.38834, "r_x2": 456.65319999999997, "r_y2": 421.0697, "r_x3": 450.33389000000005, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 427.38834, "r_x1": 469.6058, "r_y1": 427.38834, "r_x2": 469.6058, "r_y2": 421.0697, "r_x3": 463.2865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 427.38834, "r_x1": 482.55841, "r_y1": 427.38834, "r_x2": 482.55841, "r_y2": 421.0697, "r_x3": 476.23914, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 427.38834, "r_x1": 495.51105, "r_y1": 427.38834, "r_x2": 495.51105, "r_y2": 421.0697, "r_x3": 489.1917700000001, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 427.38834, "r_x1": 508.46368, "r_y1": 427.38834, "r_x2": 508.46368, "r_y2": 421.0697, "r_x3": 502.14438, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 427.38834, "r_x1": 521.41632, "r_y1": 427.38834, "r_x2": 521.41632, "r_y2": 421.0697, "r_x3": 515.09705, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 427.38834, "r_x1": 534.3689, "r_y1": 427.38834, "r_x2": 534.3689, "r_y2": 421.0697, "r_x3": 528.04962, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 438.36295, "r_x1": 391.60071, "r_y1": 438.36295, "r_x2": 391.60071, "r_y2": 432.04431, "r_x3": 385.2814, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 438.36295, "r_x1": 404.84271, "r_y1": 438.36295, "r_x2": 404.84271, "r_y2": 432.04431, "r_x3": 398.52341, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 438.36295, "r_x1": 417.79532, "r_y1": 438.36295, "r_x2": 417.79532, "r_y2": 432.04431, "r_x3": 411.47604, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 438.36295, "r_x1": 430.74796, "r_y1": 438.36295, "r_x2": 430.74796, "r_y2": 432.04431, "r_x3": 424.42865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 438.36295, "r_x1": 443.70056, "r_y1": 438.36295, "r_x2": 443.70056, "r_y2": 432.04431, "r_x3": 437.38129, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 438.36295, "r_x1": 456.65319999999997, "r_y1": 438.36295, "r_x2": 456.65319999999997, "r_y2": 432.04431, "r_x3": 450.33389000000005, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 438.36295, "r_x1": 469.6058, "r_y1": 438.36295, "r_x2": 469.6058, "r_y2": 432.04431, "r_x3": 463.2865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 438.36295, "r_x1": 482.55841, "r_y1": 438.36295, "r_x2": 482.55841, "r_y2": 432.04431, "r_x3": 476.23914, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 438.36295, "r_x1": 495.51105, "r_y1": 438.36295, "r_x2": 495.51105, "r_y2": 432.04431, "r_x3": 489.1917700000001, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 438.36295, "r_x1": 508.46368, "r_y1": 438.36295, "r_x2": 508.46368, "r_y2": 432.04431, "r_x3": 502.14438, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 438.36295, "r_x1": 521.41632, "r_y1": 438.36295, "r_x2": 521.41632, "r_y2": 432.04431, "r_x3": 515.09705, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 438.36295, "r_x1": 534.3689, "r_y1": 438.36295, "r_x2": 534.3689, "r_y2": 432.04431, "r_x3": 528.04962, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 395.51868, "r_x1": 388.44073, "r_y1": 395.51868, "r_x2": 388.44073, "r_y2": 389.20004, "r_x3": 385.2814, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 395.51868, "r_x1": 401.68274, "r_y1": 395.51868, "r_x2": 401.68274, "r_y2": 389.20004, "r_x3": 398.52341, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.4754, "r_y0": 395.51868, "r_x1": 414.63474, "r_y1": 395.51868, "r_x2": 414.63474, "r_y2": 389.20004, "r_x3": 411.4754, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.4274, "r_y0": 395.51868, "r_x1": 427.58673, "r_y1": 395.51868, "r_x2": 427.58673, "r_y2": 389.20004, "r_x3": 424.4274, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 395.51868, "r_x1": 440.53870000000006, "r_y1": 395.51868, "r_x2": 440.53870000000006, "r_y2": 389.20004, "r_x3": 437.37939, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33136, "r_y0": 395.51868, "r_x1": 453.49069000000003, "r_y1": 395.51868, "r_x2": 453.49069000000003, "r_y2": 389.20004, "r_x3": 450.33136, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28336, "r_y0": 395.51868, "r_x1": 466.44269, "r_y1": 395.51868, "r_x2": 466.44269, "r_y2": 389.20004, "r_x3": 463.28336, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23535, "r_y0": 395.51868, "r_x1": 479.39468, "r_y1": 395.51868, "r_x2": 479.39468, "r_y2": 389.20004, "r_x3": 476.23535, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18735, "r_y0": 395.51868, "r_x1": 492.34668, "r_y1": 395.51868, "r_x2": 492.34668, "r_y2": 389.20004, "r_x3": 489.18735, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.13933999999995, "r_y0": 395.51868, "r_x1": 505.29868000000005, "r_y1": 395.51868, "r_x2": 505.29868000000005, "r_y2": 389.20004, "r_x3": 502.13933999999995, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09131, "r_y0": 395.51868, "r_x1": 521.41064, "r_y1": 395.51868, "r_x2": 521.41064, "r_y2": 389.20004, "r_x3": 515.09131, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04364, "r_y0": 395.51868, "r_x1": 534.13104, "r_y1": 395.51868, "r_x2": 534.13104, "r_y2": 389.20004, "r_x3": 528.04364, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 405.29327, "r_x1": 391.60071, "r_y1": 405.29327, "r_x2": 391.60071, "r_y2": 398.97464, "r_x3": 385.2814, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 405.29327, "r_x1": 404.84271, "r_y1": 405.29327, "r_x2": 404.84271, "r_y2": 398.97464, "r_x3": 398.52341, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 405.29327, "r_x1": 417.79535, "r_y1": 405.29327, "r_x2": 417.79535, "r_y2": 398.97464, "r_x3": 411.47604, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42719, "r_y0": 413.09326, "r_x1": 430.74648999999994, "r_y1": 413.09326, "r_x2": 430.74648999999994, "r_y2": 406.77463000000006, "r_x3": 424.42719, "r_y3": 406.77463000000006, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.86941999999993, "r_y0": 417.31302, "r_x1": 509.18871999999993, "r_y1": 417.31302, "r_x2": 509.18871999999993, "r_y2": 410.99438, "r_x3": 502.86941999999993, "r_y3": 410.99438, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35437, "r_y0": 386.44281, "r_x1": 430.99261, "r_y1": 386.44281, "r_x2": 430.99261, "r_y2": 381.77722, "r_x3": 384.35437, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.595001, "r_y0": 467.63492, "r_x1": 532.63049, "r_y1": 467.63492, "r_x2": 532.63049, "r_y2": 458.72836, "r_x3": 62.595001, "r_y3": 458.72836, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 501.24741, "r_x1": 64.448898, "r_y1": 501.24741, "r_x2": 64.448898, "r_y2": 491.39536, "r_x3": 50.112, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.006828, "r_y0": 501.24741, "r_x1": 163.7558, "r_y1": 501.24741, "r_x2": 163.7558, "r_y2": 491.39536, "r_x3": 74.006828, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 545.77992, "r_x1": 286.36499, "r_y1": 545.77992, "r_x2": 286.36499, "r_y2": 536.87337, "r_x3": 62.067001, "r_y3": 536.87337, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 557.73492, "r_x1": 211.15741, "r_y1": 557.73492, "r_x2": 211.15741, "r_y2": 548.82837, "r_x3": 50.112, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.10000999999997, "r_y0": 557.50578, "r_x1": 259.17453, "r_y1": 557.50578, "r_x2": 259.17453, "r_y2": 548.91803, "r_x3": 215.10000999999997, "r_y3": 548.91803, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73492, "r_x1": 286.36273, "r_y1": 557.73492, "r_x2": 286.36273, "r_y2": 548.82837, "r_x3": 263.12, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 569.68993, "r_x1": 286.36505, "r_y1": 569.68993, "r_x2": 286.36505, "r_y2": 560.78337, "r_x3": 50.112, "r_y3": 560.78337, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 581.6449299999999, "r_x1": 286.36508, "r_y1": 581.6449299999999, "r_x2": 286.36508, "r_y2": 572.73837, "r_x3": 50.112, "r_y3": 572.73837, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 593.59993, "r_x1": 286.36508, "r_y1": 593.59993, "r_x2": 286.36508, "r_y2": 584.69337, "r_x3": 50.112, "r_y3": 584.69337, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 605.55592, "r_x1": 286.36505, "r_y1": 605.55592, "r_x2": 286.36505, "r_y2": 596.64937, "r_x3": 50.112, "r_y3": 596.64937, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 617.51093, "r_x1": 286.36508, "r_y1": 617.51093, "r_x2": 286.36508, "r_y2": 608.60437, "r_x3": 50.112, "r_y3": 608.60437, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 629.46593, "r_x1": 286.36508, "r_y1": 629.46593, "r_x2": 286.36508, "r_y2": 620.55937, "r_x3": 50.112, "r_y3": 620.55937, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 641.42093, "r_x1": 286.36508, "r_y1": 641.42093, "r_x2": 286.36508, "r_y2": 632.51437, "r_x3": 50.112, "r_y3": 632.51437, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 653.37593, "r_x1": 286.36508, "r_y1": 653.37593, "r_x2": 286.36508, "r_y2": 644.46938, "r_x3": 50.112, "r_y3": 644.46938, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 665.33094, "r_x1": 286.36511, "r_y1": 665.33094, "r_x2": 286.36511, "r_y2": 656.42438, "r_x3": 50.112, "r_y3": 656.42438, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 677.28694, "r_x1": 286.36508, "r_y1": 677.28694, "r_x2": 286.36508, "r_y2": 668.38037, "r_x3": 50.112, "r_y3": 668.38037, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 689.24194, "r_x1": 286.36511, "r_y1": 689.24194, "r_x2": 286.36511, "r_y2": 680.33537, "r_x3": 50.112, "r_y3": 680.33537, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 701.196945, "r_x1": 286.36511, "r_y1": 701.196945, "r_x2": 286.36511, "r_y2": 692.290375, "r_x3": 50.112, "r_y3": 692.290375, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.1519470000001, "r_x1": 226.88833999999997, "r_y1": 713.1519470000001, "r_x2": 226.88833999999997, "r_y2": 704.245377, "r_x3": 50.112, "r_y3": 704.245377, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 501.45663, "r_x1": 316.07382, "r_y1": 501.45663, "r_x2": 316.07382, "r_y2": 490.70892, "r_x3": 308.862, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.68954, "r_y0": 501.45663, "r_x1": 460.84848, "r_y1": 501.45663, "r_x2": 460.84848, "r_y2": 490.70892, "r_x3": 325.68954, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 521.79993, "r_x1": 545.11505, "r_y1": 521.79993, "r_x2": 545.11505, "r_y2": 512.89337, "r_x3": 320.81699, "r_y3": 512.89337, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.75491, "r_x1": 545.11517, "r_y1": 533.75491, "r_x2": 545.11517, "r_y2": 524.84836, "r_x3": 308.862, "r_y3": 524.84836, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.70992, "r_x1": 545.11511, "r_y1": 545.70992, "r_x2": 545.11511, "r_y2": 536.80336, "r_x3": 308.862, "r_y3": 536.80336, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.6649199999999, "r_x1": 545.11505, "r_y1": 557.6649199999999, "r_x2": 545.11505, "r_y2": 548.75836, "r_x3": 308.862, "r_y3": 548.75836, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.61992, "r_x1": 545.11517, "r_y1": 569.61992, "r_x2": 545.11517, "r_y2": 560.71336, "r_x3": 308.862, "r_y3": 560.71336, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.57492, "r_x1": 545.11511, "r_y1": 581.57492, "r_x2": 545.11511, "r_y2": 572.66837, "r_x3": 308.862, "r_y3": 572.66837, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.53091, "r_x1": 545.11511, "r_y1": 593.53091, "r_x2": 545.11511, "r_y2": 584.62436, "r_x3": 308.862, "r_y3": 584.62436, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.48592, "r_x1": 400.46808, "r_y1": 605.48592, "r_x2": 400.46808, "r_y2": 596.57936, "r_x3": 308.862, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.37839, "r_y0": 605.48592, "r_x1": 545.11511, "r_y1": 605.48592, "r_x2": 545.11511, "r_y2": 596.57936, "r_x3": 408.37839, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.44092, "r_x1": 545.11505, "r_y1": 617.44092, "r_x2": 545.11505, "r_y2": 608.53436, "r_x3": 308.862, "r_y3": 608.53436, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.3959199999999, "r_x1": 545.11511, "r_y1": 629.3959199999999, "r_x2": 545.11511, "r_y2": 620.48936, "r_x3": 308.862, "r_y3": 620.48936, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.35092, "r_x1": 545.11505, "r_y1": 641.35092, "r_x2": 545.11505, "r_y2": 632.4443699999999, "r_x3": 308.862, "r_y3": 632.4443699999999, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.30592, "r_x1": 365.85803, "r_y1": 653.30592, "r_x2": 365.85803, "r_y2": 644.39937, "r_x3": 308.862, "r_y3": 644.39937, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 682.84664, "r_x1": 364.40585, "r_y1": 682.84664, "r_x2": 364.40585, "r_y2": 672.09892, "r_x3": 308.862, "r_y3": 672.09892, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.345, "r_y0": 701.977753, "r_x1": 323.80792, "r_y1": 701.977753, "r_x2": 323.80792, "r_y2": 693.9617920000001, "r_x3": 313.345, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05127, "r_y0": 701.977753, "r_x1": 545.10852, "r_y1": 701.977753, "r_x2": 545.10852, "r_y2": 693.9617920000001, "r_x3": 326.05127, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 712.936752, "r_x1": 545.1134, "r_y1": 712.936752, "r_x2": 545.1134, "r_y2": 704.920792, "r_x3": 328.78101, "r_y3": 704.920792, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 18, "label": "caption", "bbox": { "l": 53.811783000000005, "t": 208.23328000000004, "r": 385.93451, "b": 216.10645, "coord_origin": "TOPLEFT" }, "confidence": 0.5986505746841431, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 216.10645, "r_x1": 62.219952, "r_y1": 216.10645, "r_x2": 62.219952, "r_y2": 208.23328000000004, "r_x3": 53.811783000000005, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.424026, "r_y0": 216.10645, "r_x1": 385.93451, "r_y1": 216.10645, "r_x2": 385.93451, "r_y2": 208.23328000000004, "r_x3": 66.424026, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "section_header", "bbox": { "l": 53.811783000000005, "t": 94.28112999999996, "r": 284.34592, "b": 102.15430000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.46452972292900085, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 102.15430000000003, "r_x1": 284.34592, "r_y1": 102.15430000000003, "r_x2": 284.34592, "r_y2": 94.28112999999996, "r_x3": 53.811783000000005, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "section_header", "bbox": { "l": 304.83081, "t": 94.28112999999996, "r": 431.09119, "b": 102.15430000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.4629225730895996, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83081, "r_y0": 102.15430000000003, "r_x1": 431.09119, "r_y1": 102.15430000000003, "r_x2": 431.09119, "r_y2": 94.28112999999996, "r_x3": 304.83081, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "list_item", "bbox": { "l": 53.286037, "t": 78.68756000000008, "r": 61.550289, "b": 86.56073000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.5820134282112122, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.286037, "r_y0": 86.56073000000004, "r_x1": 61.550289, "r_y1": 86.56073000000004, "r_x2": 61.550289, "r_y2": 78.68756000000008, "r_x3": 53.286037, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "list_item", "bbox": { "l": 65.682419, "t": 78.68756000000008, "r": 499.55563, "b": 86.56073000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.541211724281311, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.682419, "r_y0": 86.56073000000004, "r_x1": 499.55563, "r_y1": 86.56073000000004, "r_x2": 499.55563, "r_y2": 78.68756000000008, "r_x3": 65.682419, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT" }, "confidence": 0.8824009299278259, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93285, "t": 222.18073000000004, "r": 241.04458999999997, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76489, "t": 222.18073000000004, "r": 284.50589, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.24990999999999, "t": 229.66594999999995, "r": 120.62018, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.36609, "t": 229.66594999999995, "r": 196.1071, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.10756, "t": 229.66594999999995, "r": 201.29247, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62408, "t": 229.66594999999995, "r": 219.99435, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.19814, "t": 229.66594999999995, "r": 244.75377, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.1142, "t": 229.66594999999995, "r": 266.48447, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38434, "t": 229.66594999999995, "r": 293.93997, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53052099999999, "t": 236.42584, "r": 162.7131, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.39731, "t": 236.42584, "r": 189.56456, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99026, "t": 236.42584, "r": 214.15752, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.87517, "t": 236.42584, "r": 237.45833000000002, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88446, "t": 236.42584, "r": 264.6358, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06134, "t": 236.42584, "r": 286.6445, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53052099999999, "t": 242.62048000000004, "r": 139.72253, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.10536, "t": 242.62048000000004, "r": 190.8567, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.69832, "t": 242.62048000000004, "r": 215.44965999999997, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.87517, "t": 242.62048000000004, "r": 237.45833000000002, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88446, "t": 242.62048000000004, "r": 264.6358, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06134, "t": 242.62048000000004, "r": 286.6445, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53052099999999, "t": 249.79845999999998, "r": 97.013, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.698288, "t": 249.58942000000002, "r": 103.03371, "b": 253.94732999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03389, "t": 249.79845999999998, "r": 128.96027, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.10536, "t": 248.81506000000002, "r": 190.8567, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28223, "t": 248.81506000000002, "r": 212.86539, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29153, "t": 248.81506000000002, "r": 240.04287999999997, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88446, "t": 248.81506000000002, "r": 264.6358, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.47742, "t": 248.81506000000002, "r": 289.22876, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53052099999999, "t": 257.28369, "r": 91.827637, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.052673, "t": 257.07465, "r": 93.219925, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.220474, "t": 257.28369, "r": 119.14685, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45073999999998, "t": 257.07465, "r": 129.88177, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.10536, "t": 256.30029, "r": 190.8567, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28223, "t": 256.30029, "r": 212.86539, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29153, "t": 256.30029, "r": 240.04287999999997, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88446, "t": 256.30029, "r": 264.6358, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.47742, "t": 256.30029, "r": 289.22876, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53052099999999, "t": 264.5108, "r": 60.715424, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.17654799999999, "t": 264.30175999999994, "r": 65.343796, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.344376, "t": 264.5108, "r": 122.38297000000001, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45073999999998, "t": 264.30175999999994, "r": 129.88177, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.10536, "t": 263.52739999999994, "r": 190.8567, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28223, "t": 263.52739999999994, "r": 212.86539, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29153, "t": 263.52739999999994, "r": 240.04287999999997, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88446, "t": 263.52739999999994, "r": 264.6358, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.47742, "t": 263.52739999999994, "r": 289.22876, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53052099999999, "t": 271.73785, "r": 107.38374, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99034, "t": 271.52881, "r": 109.74168000000002, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74204, "t": 271.73785, "r": 114.92695000000002, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.38793, "t": 271.52881, "r": 122.13927, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.13963, "t": 271.73785, "r": 127.32454000000001, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.39731, "t": 270.75446, "r": 189.56456, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28223, "t": 270.75446, "r": 212.86539, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58348, "t": 270.75446, "r": 238.75072999999998, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88446, "t": 270.75446, "r": 264.6358, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.47742, "t": 270.75446, "r": 289.22876, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53052099999999, "t": 279.01392, "r": 68.68605, "b": 283.37183, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.685814, "t": 279.22295999999994, "r": 110.16829999999999, "b": 283.40436, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.10536, "t": 277.98157000000003, "r": 190.8567, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99026, "t": 277.98157000000003, "r": 214.15752, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58348, "t": 277.98157000000003, "r": 238.75072999999998, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88446, "t": 277.98157000000003, "r": 264.6358, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.76938, "t": 277.98157000000003, "r": 287.93661, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.61508, "t": 286.45004, "r": 174.79999, "b": 290.63141, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.10536, "t": 285.46667, "r": 190.8567, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.69832, "t": 285.46667, "r": 215.44965999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29153, "t": 285.46667, "r": 240.04287999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.76506, "t": 285.46667, "r": 265.75204, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.47742, "t": 285.46667, "r": 289.22876, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 16, "label": "caption", "bbox": { "l": 380.42731, "t": 292.30426, "r": 549.42175, "b": 298.60284, "coord_origin": "TOPLEFT" }, "confidence": 0.7499915957450867, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.42731, "r_y0": 298.60284, "r_x1": 549.42175, "r_y1": 298.60284, "r_x2": 549.42175, "r_y2": 292.30426, "r_x3": 380.42731, "r_y3": 292.30426, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "table", "bbox": { "l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8899767994880676, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.04861, "t": 221.62415, "r": 542.00018, "b": 226.68933000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82193, "t": 227.83416999999997, "r": 507.2258, "b": 232.89935000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.2442, "t": 236.74712999999997, "r": 400.74588, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.74643, "t": 236.74712999999997, "r": 404.64523, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.6463, "t": 236.74712999999997, "r": 407.34631, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.09671, "t": 221.57446000000004, "r": 438.0145, "b": 226.63964999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18323, "t": 236.74712999999997, "r": 440.98778999999996, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38254, "t": 236.74712999999997, "r": 482.48465000000004, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.92578, "t": 236.74712999999997, "r": 530.73035, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11493, "t": 244.61084000000005, "r": 355.6532, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65427, "t": 244.61084000000005, "r": 364.65607, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.24661, "t": 244.91327, "r": 400.75238, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.7529, "t": 244.91327, "r": 403.75531, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.81838999999997, "t": 244.91327, "r": 437.32708999999994, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.52859, "t": 244.91327, "r": 478.40103, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.97552, "t": 244.91327, "r": 483.55001999999996, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.44824, "t": 244.91327, "r": 531.46967, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11493, "t": 253.68451000000005, "r": 325.62674, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.24661, "t": 253.68451000000005, "r": 400.75238, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.7529, "t": 253.68451000000005, "r": 403.75531, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.81838999999997, "t": 253.68451000000005, "r": 437.32708999999994, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.43579000000005, "t": 253.68451000000005, "r": 482.54831, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29065, "t": 253.68451000000005, "r": 530.80981, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11493, "t": 261.54822, "r": 322.62866, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43222, "t": 261.54822, "r": 400.73563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73456, "t": 261.54822, "r": 403.73697, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.73804, "t": 261.54822, "r": 405.53625, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7016, "t": 261.54822, "r": 438.80563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.55533, "t": 261.54822, "r": 482.07043, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.01862, "t": 261.54822, "r": 529.53375, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11493, "t": 269.64148, "r": 356.24771, "b": 274.70667000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43222, "t": 270.31946000000005, "r": 400.73563, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73456, "t": 270.31946000000005, "r": 403.73697, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.73804, "t": 270.31946000000005, "r": 405.53625, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.02802, "t": 270.31946000000005, "r": 436.4280099999999, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83099000000004, "t": 270.31946000000005, "r": 482.35013, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.01862, "t": 270.31946000000005, "r": 529.53375, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11493, "t": 278.48572, "r": 373.35764, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.24661, "t": 278.48572, "r": 403.75531, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.51599, "t": 278.48572, "r": 437.02469, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.7142, "t": 278.48572, "r": 484.73965000000004, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99463, "t": 278.48572, "r": 534.02008, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 6, "label": "caption", "bbox": { "l": 50.112, "t": 320.87735, "r": 545.11377, "b": 365.64987, "coord_origin": "TOPLEFT" }, "confidence": 0.9140303134918213, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 329.78391, "r_x1": 86.864021, "r_y1": 329.78391, "r_x2": 86.864021, "r_y2": 320.87735, "r_x3": 50.112, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.917542, "r_y0": 329.78391, "r_x1": 545.11371, "r_y1": 329.78391, "r_x2": 545.11371, "r_y2": 320.87735, "r_x3": 93.917542, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 341.73889, "r_x1": 545.11371, "r_y1": 341.73889, "r_x2": 545.11371, "r_y2": 332.83233999999993, "r_x3": 50.112, "r_y3": 332.83233999999993, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 353.69388, "r_x1": 545.11377, "r_y1": 353.69388, "r_x2": 545.11377, "r_y2": 344.78732, "r_x3": 50.112, "r_y3": 344.78732, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.64987, "r_x1": 139.79532, "r_y1": 365.64987, "r_x2": 139.79532, "r_y2": 356.74332, "r_x3": 50.112, "r_y3": 356.74332, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "picture", "bbox": { "l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT" }, "confidence": 0.805853009223938, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26282, "r_y0": 386.44281, "r_x1": 342.07819, "r_y1": 386.44281, "r_x2": 342.07819, "r_y2": 381.77722, "r_x3": 220.26282, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 167, "label": "text", "bbox": { "l": 220.26282, "t": 381.77722, "r": 342.07819, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26282, "r_y0": 386.44281, "r_x1": 342.07819, "r_y1": 386.44281, "r_x2": 342.07819, "r_y2": 381.77722, "r_x3": 220.26282, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 11, "label": "picture", "bbox": { "l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT" }, "confidence": 0.8308426737785339, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.715248, "r_y0": 386.44281, "r_x1": 85.657333, "r_y1": 386.44281, "r_x2": 85.657333, "r_y2": 381.77722, "r_x3": 53.715248, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 168, "label": "text", "bbox": { "l": 53.715248, "t": 381.77722, "r": 85.657333, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.715248, "r_y0": 386.44281, "r_x1": 85.657333, "r_y1": 386.44281, "r_x2": 85.657333, "r_y2": 381.77722, "r_x3": 53.715248, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 13, "label": "picture", "bbox": { "l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT" }, "confidence": 0.7881615161895752, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 406.87158, "r_x1": 443.69870000000003, "r_y1": 406.87158, "r_x2": 443.69870000000003, "r_y2": 400.55295, "r_x3": 437.37939, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 406.87158, "r_x1": 456.6513100000001, "r_y1": 406.87158, "r_x2": 456.6513100000001, "r_y2": 400.55295, "r_x3": 450.33203, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 406.87158, "r_x1": 469.60394, "r_y1": 406.87158, "r_x2": 469.60394, "r_y2": 400.55295, "r_x3": 463.28464, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23724000000004, "r_y0": 406.87158, "r_x1": 482.5565500000001, "r_y1": 406.87158, "r_x2": 482.5565500000001, "r_y2": 400.55295, "r_x3": 476.23724000000004, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18988, "r_y0": 406.87158, "r_x1": 495.50916, "r_y1": 406.87158, "r_x2": 495.50916, "r_y2": 400.55295, "r_x3": 489.18988, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14251999999993, "r_y0": 406.87158, "r_x1": 508.46178999999995, "r_y1": 406.87158, "r_x2": 508.46178999999995, "r_y2": 400.55295, "r_x3": 502.14251999999993, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09509, "r_y0": 406.87158, "r_x1": 521.41443, "r_y1": 406.87158, "r_x2": 521.41443, "r_y2": 400.55295, "r_x3": 515.09509, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 417.35699, "r_x1": 391.60071, "r_y1": 417.35699, "r_x2": 391.60071, "r_y2": 411.03836000000007, "r_x3": 385.2814, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 417.35699, "r_x1": 404.84271, "r_y1": 417.35699, "r_x2": 404.84271, "r_y2": 411.03836000000007, "r_x3": 398.52341, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 417.35699, "r_x1": 417.79535, "r_y1": 417.35699, "r_x2": 417.79535, "r_y2": 411.03836000000007, "r_x3": 411.47604, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 417.35699, "r_x1": 443.69870000000003, "r_y1": 417.35699, "r_x2": 443.69870000000003, "r_y2": 411.03836000000007, "r_x3": 437.37939, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 417.35699, "r_x1": 456.6513100000001, "r_y1": 417.35699, "r_x2": 456.6513100000001, "r_y2": 411.03836000000007, "r_x3": 450.33203, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 417.35699, "r_x1": 469.60394, "r_y1": 417.35699, "r_x2": 469.60394, "r_y2": 411.03836000000007, "r_x3": 463.28464, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 427.38834, "r_x1": 391.60071, "r_y1": 427.38834, "r_x2": 391.60071, "r_y2": 421.0697, "r_x3": 385.2814, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 427.38834, "r_x1": 404.84271, "r_y1": 427.38834, "r_x2": 404.84271, "r_y2": 421.0697, "r_x3": 398.52341, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 427.38834, "r_x1": 417.79532, "r_y1": 427.38834, "r_x2": 417.79532, "r_y2": 421.0697, "r_x3": 411.47604, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 427.38834, "r_x1": 430.74796, "r_y1": 427.38834, "r_x2": 430.74796, "r_y2": 421.0697, "r_x3": 424.42865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 427.38834, "r_x1": 443.70056, "r_y1": 427.38834, "r_x2": 443.70056, "r_y2": 421.0697, "r_x3": 437.38129, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 427.38834, "r_x1": 456.65319999999997, "r_y1": 427.38834, "r_x2": 456.65319999999997, "r_y2": 421.0697, "r_x3": 450.33389000000005, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 427.38834, "r_x1": 469.6058, "r_y1": 427.38834, "r_x2": 469.6058, "r_y2": 421.0697, "r_x3": 463.2865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 427.38834, "r_x1": 482.55841, "r_y1": 427.38834, "r_x2": 482.55841, "r_y2": 421.0697, "r_x3": 476.23914, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 427.38834, "r_x1": 495.51105, "r_y1": 427.38834, "r_x2": 495.51105, "r_y2": 421.0697, "r_x3": 489.1917700000001, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 427.38834, "r_x1": 508.46368, "r_y1": 427.38834, "r_x2": 508.46368, "r_y2": 421.0697, "r_x3": 502.14438, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 427.38834, "r_x1": 521.41632, "r_y1": 427.38834, "r_x2": 521.41632, "r_y2": 421.0697, "r_x3": 515.09705, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 427.38834, "r_x1": 534.3689, "r_y1": 427.38834, "r_x2": 534.3689, "r_y2": 421.0697, "r_x3": 528.04962, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 438.36295, "r_x1": 391.60071, "r_y1": 438.36295, "r_x2": 391.60071, "r_y2": 432.04431, "r_x3": 385.2814, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 438.36295, "r_x1": 404.84271, "r_y1": 438.36295, "r_x2": 404.84271, "r_y2": 432.04431, "r_x3": 398.52341, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 438.36295, "r_x1": 417.79532, "r_y1": 438.36295, "r_x2": 417.79532, "r_y2": 432.04431, "r_x3": 411.47604, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 438.36295, "r_x1": 430.74796, "r_y1": 438.36295, "r_x2": 430.74796, "r_y2": 432.04431, "r_x3": 424.42865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 438.36295, "r_x1": 443.70056, "r_y1": 438.36295, "r_x2": 443.70056, "r_y2": 432.04431, "r_x3": 437.38129, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 438.36295, "r_x1": 456.65319999999997, "r_y1": 438.36295, "r_x2": 456.65319999999997, "r_y2": 432.04431, "r_x3": 450.33389000000005, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 438.36295, "r_x1": 469.6058, "r_y1": 438.36295, "r_x2": 469.6058, "r_y2": 432.04431, "r_x3": 463.2865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 438.36295, "r_x1": 482.55841, "r_y1": 438.36295, "r_x2": 482.55841, "r_y2": 432.04431, "r_x3": 476.23914, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 438.36295, "r_x1": 495.51105, "r_y1": 438.36295, "r_x2": 495.51105, "r_y2": 432.04431, "r_x3": 489.1917700000001, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 438.36295, "r_x1": 508.46368, "r_y1": 438.36295, "r_x2": 508.46368, "r_y2": 432.04431, "r_x3": 502.14438, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 438.36295, "r_x1": 521.41632, "r_y1": 438.36295, "r_x2": 521.41632, "r_y2": 432.04431, "r_x3": 515.09705, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 438.36295, "r_x1": 534.3689, "r_y1": 438.36295, "r_x2": 534.3689, "r_y2": 432.04431, "r_x3": 528.04962, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 395.51868, "r_x1": 388.44073, "r_y1": 395.51868, "r_x2": 388.44073, "r_y2": 389.20004, "r_x3": 385.2814, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 395.51868, "r_x1": 401.68274, "r_y1": 395.51868, "r_x2": 401.68274, "r_y2": 389.20004, "r_x3": 398.52341, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.4754, "r_y0": 395.51868, "r_x1": 414.63474, "r_y1": 395.51868, "r_x2": 414.63474, "r_y2": 389.20004, "r_x3": 411.4754, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.4274, "r_y0": 395.51868, "r_x1": 427.58673, "r_y1": 395.51868, "r_x2": 427.58673, "r_y2": 389.20004, "r_x3": 424.4274, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 395.51868, "r_x1": 440.53870000000006, "r_y1": 395.51868, "r_x2": 440.53870000000006, "r_y2": 389.20004, "r_x3": 437.37939, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33136, "r_y0": 395.51868, "r_x1": 453.49069000000003, "r_y1": 395.51868, "r_x2": 453.49069000000003, "r_y2": 389.20004, "r_x3": 450.33136, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28336, "r_y0": 395.51868, "r_x1": 466.44269, "r_y1": 395.51868, "r_x2": 466.44269, "r_y2": 389.20004, "r_x3": 463.28336, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23535, "r_y0": 395.51868, "r_x1": 479.39468, "r_y1": 395.51868, "r_x2": 479.39468, "r_y2": 389.20004, "r_x3": 476.23535, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18735, "r_y0": 395.51868, "r_x1": 492.34668, "r_y1": 395.51868, "r_x2": 492.34668, "r_y2": 389.20004, "r_x3": 489.18735, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.13933999999995, "r_y0": 395.51868, "r_x1": 505.29868000000005, "r_y1": 395.51868, "r_x2": 505.29868000000005, "r_y2": 389.20004, "r_x3": 502.13933999999995, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09131, "r_y0": 395.51868, "r_x1": 521.41064, "r_y1": 395.51868, "r_x2": 521.41064, "r_y2": 389.20004, "r_x3": 515.09131, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04364, "r_y0": 395.51868, "r_x1": 534.13104, "r_y1": 395.51868, "r_x2": 534.13104, "r_y2": 389.20004, "r_x3": 528.04364, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 405.29327, "r_x1": 391.60071, "r_y1": 405.29327, "r_x2": 391.60071, "r_y2": 398.97464, "r_x3": 385.2814, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 405.29327, "r_x1": 404.84271, "r_y1": 405.29327, "r_x2": 404.84271, "r_y2": 398.97464, "r_x3": 398.52341, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 405.29327, "r_x1": 417.79535, "r_y1": 405.29327, "r_x2": 417.79535, "r_y2": 398.97464, "r_x3": 411.47604, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42719, "r_y0": 413.09326, "r_x1": 430.74648999999994, "r_y1": 413.09326, "r_x2": 430.74648999999994, "r_y2": 406.77463000000006, "r_x3": 424.42719, "r_y3": 406.77463000000006, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.86941999999993, "r_y0": 417.31302, "r_x1": 509.18871999999993, "r_y1": 417.31302, "r_x2": 509.18871999999993, "r_y2": 410.99438, "r_x3": 502.86941999999993, "r_y3": 410.99438, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35437, "r_y0": 386.44281, "r_x1": 430.99261, "r_y1": 386.44281, "r_x2": 430.99261, "r_y2": 381.77722, "r_x3": 384.35437, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 169, "label": "text", "bbox": { "l": 437.37939, "t": 400.55295, "r": 443.69870000000003, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 406.87158, "r_x1": 443.69870000000003, "r_y1": 406.87158, "r_x2": 443.69870000000003, "r_y2": 400.55295, "r_x3": 437.37939, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 170, "label": "text", "bbox": { "l": 450.33203, "t": 400.55295, "r": 456.6513100000001, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 406.87158, "r_x1": 456.6513100000001, "r_y1": 406.87158, "r_x2": 456.6513100000001, "r_y2": 400.55295, "r_x3": 450.33203, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 171, "label": "text", "bbox": { "l": 463.28464, "t": 400.55295, "r": 469.60394, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 406.87158, "r_x1": 469.60394, "r_y1": 406.87158, "r_x2": 469.60394, "r_y2": 400.55295, "r_x3": 463.28464, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 172, "label": "text", "bbox": { "l": 476.23724000000004, "t": 400.55295, "r": 482.5565500000001, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23724000000004, "r_y0": 406.87158, "r_x1": 482.5565500000001, "r_y1": 406.87158, "r_x2": 482.5565500000001, "r_y2": 400.55295, "r_x3": 476.23724000000004, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 173, "label": "text", "bbox": { "l": 489.18988, "t": 400.55295, "r": 495.50916, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18988, "r_y0": 406.87158, "r_x1": 495.50916, "r_y1": 406.87158, "r_x2": 495.50916, "r_y2": 400.55295, "r_x3": 489.18988, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 174, "label": "text", "bbox": { "l": 502.14251999999993, "t": 400.55295, "r": 508.46178999999995, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14251999999993, "r_y0": 406.87158, "r_x1": 508.46178999999995, "r_y1": 406.87158, "r_x2": 508.46178999999995, "r_y2": 400.55295, "r_x3": 502.14251999999993, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 175, "label": "text", "bbox": { "l": 515.09509, "t": 400.55295, "r": 521.41443, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09509, "r_y0": 406.87158, "r_x1": 521.41443, "r_y1": 406.87158, "r_x2": 521.41443, "r_y2": 400.55295, "r_x3": 515.09509, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 176, "label": "text", "bbox": { "l": 385.2814, "t": 411.03836000000007, "r": 391.60071, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 417.35699, "r_x1": 391.60071, "r_y1": 417.35699, "r_x2": 391.60071, "r_y2": 411.03836000000007, "r_x3": 385.2814, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 177, "label": "text", "bbox": { "l": 398.52341, "t": 411.03836000000007, "r": 404.84271, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 417.35699, "r_x1": 404.84271, "r_y1": 417.35699, "r_x2": 404.84271, "r_y2": 411.03836000000007, "r_x3": 398.52341, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 178, "label": "text", "bbox": { "l": 411.47604, "t": 411.03836000000007, "r": 417.79535, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 417.35699, "r_x1": 417.79535, "r_y1": 417.35699, "r_x2": 417.79535, "r_y2": 411.03836000000007, "r_x3": 411.47604, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 179, "label": "text", "bbox": { "l": 437.37939, "t": 411.03836000000007, "r": 443.69870000000003, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 417.35699, "r_x1": 443.69870000000003, "r_y1": 417.35699, "r_x2": 443.69870000000003, "r_y2": 411.03836000000007, "r_x3": 437.37939, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 180, "label": "text", "bbox": { "l": 450.33203, "t": 411.03836000000007, "r": 456.6513100000001, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 417.35699, "r_x1": 456.6513100000001, "r_y1": 417.35699, "r_x2": 456.6513100000001, "r_y2": 411.03836000000007, "r_x3": 450.33203, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 181, "label": "text", "bbox": { "l": 463.28464, "t": 411.03836000000007, "r": 469.60394, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 417.35699, "r_x1": 469.60394, "r_y1": 417.35699, "r_x2": 469.60394, "r_y2": 411.03836000000007, "r_x3": 463.28464, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 182, "label": "text", "bbox": { "l": 385.2814, "t": 421.0697, "r": 391.60071, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 427.38834, "r_x1": 391.60071, "r_y1": 427.38834, "r_x2": 391.60071, "r_y2": 421.0697, "r_x3": 385.2814, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 183, "label": "text", "bbox": { "l": 398.52341, "t": 421.0697, "r": 404.84271, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 427.38834, "r_x1": 404.84271, "r_y1": 427.38834, "r_x2": 404.84271, "r_y2": 421.0697, "r_x3": 398.52341, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 184, "label": "text", "bbox": { "l": 411.47604, "t": 421.0697, "r": 417.79532, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 427.38834, "r_x1": 417.79532, "r_y1": 427.38834, "r_x2": 417.79532, "r_y2": 421.0697, "r_x3": 411.47604, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 185, "label": "text", "bbox": { "l": 424.42865, "t": 421.0697, "r": 430.74796, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 427.38834, "r_x1": 430.74796, "r_y1": 427.38834, "r_x2": 430.74796, "r_y2": 421.0697, "r_x3": 424.42865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 186, "label": "text", "bbox": { "l": 437.38129, "t": 421.0697, "r": 443.70056, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 427.38834, "r_x1": 443.70056, "r_y1": 427.38834, "r_x2": 443.70056, "r_y2": 421.0697, "r_x3": 437.38129, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 187, "label": "text", "bbox": { "l": 450.33389000000005, "t": 421.0697, "r": 456.65319999999997, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 427.38834, "r_x1": 456.65319999999997, "r_y1": 427.38834, "r_x2": 456.65319999999997, "r_y2": 421.0697, "r_x3": 450.33389000000005, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 188, "label": "text", "bbox": { "l": 463.2865, "t": 421.0697, "r": 469.6058, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 427.38834, "r_x1": 469.6058, "r_y1": 427.38834, "r_x2": 469.6058, "r_y2": 421.0697, "r_x3": 463.2865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 189, "label": "text", "bbox": { "l": 476.23914, "t": 421.0697, "r": 482.55841, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 427.38834, "r_x1": 482.55841, "r_y1": 427.38834, "r_x2": 482.55841, "r_y2": 421.0697, "r_x3": 476.23914, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 190, "label": "text", "bbox": { "l": 489.1917700000001, "t": 421.0697, "r": 495.51105, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 427.38834, "r_x1": 495.51105, "r_y1": 427.38834, "r_x2": 495.51105, "r_y2": 421.0697, "r_x3": 489.1917700000001, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 191, "label": "text", "bbox": { "l": 502.14438, "t": 421.0697, "r": 508.46368, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 427.38834, "r_x1": 508.46368, "r_y1": 427.38834, "r_x2": 508.46368, "r_y2": 421.0697, "r_x3": 502.14438, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 192, "label": "text", "bbox": { "l": 515.09705, "t": 421.0697, "r": 521.41632, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 427.38834, "r_x1": 521.41632, "r_y1": 427.38834, "r_x2": 521.41632, "r_y2": 421.0697, "r_x3": 515.09705, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 193, "label": "text", "bbox": { "l": 528.04962, "t": 421.0697, "r": 534.3689, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 427.38834, "r_x1": 534.3689, "r_y1": 427.38834, "r_x2": 534.3689, "r_y2": 421.0697, "r_x3": 528.04962, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 194, "label": "text", "bbox": { "l": 385.2814, "t": 432.04431, "r": 391.60071, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 438.36295, "r_x1": 391.60071, "r_y1": 438.36295, "r_x2": 391.60071, "r_y2": 432.04431, "r_x3": 385.2814, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 195, "label": "text", "bbox": { "l": 398.52341, "t": 432.04431, "r": 404.84271, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 438.36295, "r_x1": 404.84271, "r_y1": 438.36295, "r_x2": 404.84271, "r_y2": 432.04431, "r_x3": 398.52341, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 196, "label": "text", "bbox": { "l": 411.47604, "t": 432.04431, "r": 417.79532, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 438.36295, "r_x1": 417.79532, "r_y1": 438.36295, "r_x2": 417.79532, "r_y2": 432.04431, "r_x3": 411.47604, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 197, "label": "text", "bbox": { "l": 424.42865, "t": 432.04431, "r": 430.74796, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 438.36295, "r_x1": 430.74796, "r_y1": 438.36295, "r_x2": 430.74796, "r_y2": 432.04431, "r_x3": 424.42865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 198, "label": "text", "bbox": { "l": 437.38129, "t": 432.04431, "r": 443.70056, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 438.36295, "r_x1": 443.70056, "r_y1": 438.36295, "r_x2": 443.70056, "r_y2": 432.04431, "r_x3": 437.38129, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 199, "label": "text", "bbox": { "l": 450.33389000000005, "t": 432.04431, "r": 456.65319999999997, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 438.36295, "r_x1": 456.65319999999997, "r_y1": 438.36295, "r_x2": 456.65319999999997, "r_y2": 432.04431, "r_x3": 450.33389000000005, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 200, "label": "text", "bbox": { "l": 463.2865, "t": 432.04431, "r": 469.6058, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 438.36295, "r_x1": 469.6058, "r_y1": 438.36295, "r_x2": 469.6058, "r_y2": 432.04431, "r_x3": 463.2865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 201, "label": "text", "bbox": { "l": 476.23914, "t": 432.04431, "r": 482.55841, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 438.36295, "r_x1": 482.55841, "r_y1": 438.36295, "r_x2": 482.55841, "r_y2": 432.04431, "r_x3": 476.23914, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 202, "label": "text", "bbox": { "l": 489.1917700000001, "t": 432.04431, "r": 495.51105, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 438.36295, "r_x1": 495.51105, "r_y1": 438.36295, "r_x2": 495.51105, "r_y2": 432.04431, "r_x3": 489.1917700000001, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 203, "label": "text", "bbox": { "l": 502.14438, "t": 432.04431, "r": 508.46368, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 438.36295, "r_x1": 508.46368, "r_y1": 438.36295, "r_x2": 508.46368, "r_y2": 432.04431, "r_x3": 502.14438, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 204, "label": "text", "bbox": { "l": 515.09705, "t": 432.04431, "r": 521.41632, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 438.36295, "r_x1": 521.41632, "r_y1": 438.36295, "r_x2": 521.41632, "r_y2": 432.04431, "r_x3": 515.09705, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 205, "label": "text", "bbox": { "l": 528.04962, "t": 432.04431, "r": 534.3689, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 438.36295, "r_x1": 534.3689, "r_y1": 438.36295, "r_x2": 534.3689, "r_y2": 432.04431, "r_x3": 528.04962, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 206, "label": "text", "bbox": { "l": 385.2814, "t": 389.20004, "r": 388.44073, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 395.51868, "r_x1": 388.44073, "r_y1": 395.51868, "r_x2": 388.44073, "r_y2": 389.20004, "r_x3": 385.2814, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 207, "label": "text", "bbox": { "l": 398.52341, "t": 389.20004, "r": 401.68274, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 395.51868, "r_x1": 401.68274, "r_y1": 395.51868, "r_x2": 401.68274, "r_y2": 389.20004, "r_x3": 398.52341, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 208, "label": "text", "bbox": { "l": 411.4754, "t": 389.20004, "r": 414.63474, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.4754, "r_y0": 395.51868, "r_x1": 414.63474, "r_y1": 395.51868, "r_x2": 414.63474, "r_y2": 389.20004, "r_x3": 411.4754, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 209, "label": "text", "bbox": { "l": 424.4274, "t": 389.20004, "r": 427.58673, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.4274, "r_y0": 395.51868, "r_x1": 427.58673, "r_y1": 395.51868, "r_x2": 427.58673, "r_y2": 389.20004, "r_x3": 424.4274, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 210, "label": "text", "bbox": { "l": 437.37939, "t": 389.20004, "r": 440.53870000000006, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 395.51868, "r_x1": 440.53870000000006, "r_y1": 395.51868, "r_x2": 440.53870000000006, "r_y2": 389.20004, "r_x3": 437.37939, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 211, "label": "text", "bbox": { "l": 450.33136, "t": 389.20004, "r": 453.49069000000003, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33136, "r_y0": 395.51868, "r_x1": 453.49069000000003, "r_y1": 395.51868, "r_x2": 453.49069000000003, "r_y2": 389.20004, "r_x3": 450.33136, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 212, "label": "text", "bbox": { "l": 463.28336, "t": 389.20004, "r": 466.44269, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28336, "r_y0": 395.51868, "r_x1": 466.44269, "r_y1": 395.51868, "r_x2": 466.44269, "r_y2": 389.20004, "r_x3": 463.28336, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 213, "label": "text", "bbox": { "l": 476.23535, "t": 389.20004, "r": 479.39468, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23535, "r_y0": 395.51868, "r_x1": 479.39468, "r_y1": 395.51868, "r_x2": 479.39468, "r_y2": 389.20004, "r_x3": 476.23535, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 214, "label": "text", "bbox": { "l": 489.18735, "t": 389.20004, "r": 492.34668, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18735, "r_y0": 395.51868, "r_x1": 492.34668, "r_y1": 395.51868, "r_x2": 492.34668, "r_y2": 389.20004, "r_x3": 489.18735, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 215, "label": "text", "bbox": { "l": 502.13933999999995, "t": 389.20004, "r": 505.29868000000005, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.13933999999995, "r_y0": 395.51868, "r_x1": 505.29868000000005, "r_y1": 395.51868, "r_x2": 505.29868000000005, "r_y2": 389.20004, "r_x3": 502.13933999999995, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 216, "label": "text", "bbox": { "l": 515.09131, "t": 389.20004, "r": 521.41064, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09131, "r_y0": 395.51868, "r_x1": 521.41064, "r_y1": 395.51868, "r_x2": 521.41064, "r_y2": 389.20004, "r_x3": 515.09131, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 217, "label": "text", "bbox": { "l": 528.04364, "t": 389.20004, "r": 534.13104, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04364, "r_y0": 395.51868, "r_x1": 534.13104, "r_y1": 395.51868, "r_x2": 534.13104, "r_y2": 389.20004, "r_x3": 528.04364, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 218, "label": "text", "bbox": { "l": 385.2814, "t": 398.97464, "r": 391.60071, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 405.29327, "r_x1": 391.60071, "r_y1": 405.29327, "r_x2": 391.60071, "r_y2": 398.97464, "r_x3": 385.2814, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 219, "label": "text", "bbox": { "l": 398.52341, "t": 398.97464, "r": 404.84271, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 405.29327, "r_x1": 404.84271, "r_y1": 405.29327, "r_x2": 404.84271, "r_y2": 398.97464, "r_x3": 398.52341, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 220, "label": "text", "bbox": { "l": 411.47604, "t": 398.97464, "r": 417.79535, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 405.29327, "r_x1": 417.79535, "r_y1": 405.29327, "r_x2": 417.79535, "r_y2": 398.97464, "r_x3": 411.47604, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 221, "label": "text", "bbox": { "l": 424.42719, "t": 406.77463000000006, "r": 430.74648999999994, "b": 413.09326, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42719, "r_y0": 413.09326, "r_x1": 430.74648999999994, "r_y1": 413.09326, "r_x2": 430.74648999999994, "r_y2": 406.77463000000006, "r_x3": 424.42719, "r_y3": 406.77463000000006, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 222, "label": "text", "bbox": { "l": 502.86941999999993, "t": 410.99438, "r": 509.18871999999993, "b": 417.31302, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.86941999999993, "r_y0": 417.31302, "r_x1": 509.18871999999993, "r_y1": 417.31302, "r_x2": 509.18871999999993, "r_y2": 410.99438, "r_x3": 502.86941999999993, "r_y3": 410.99438, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 223, "label": "text", "bbox": { "l": 384.35437, "t": 381.77722, "r": 430.99261, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35437, "r_y0": 386.44281, "r_x1": 430.99261, "r_y1": 386.44281, "r_x2": 430.99261, "r_y2": 381.77722, "r_x3": 384.35437, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 5, "label": "caption", "bbox": { "l": 62.595001, "t": 458.72836, "r": 532.63049, "b": 467.63492, "coord_origin": "TOPLEFT" }, "confidence": 0.9153602719306946, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.595001, "r_y0": 467.63492, "r_x1": 532.63049, "r_y1": 467.63492, "r_x2": 532.63049, "r_y2": 458.72836, "r_x3": 62.595001, "r_y3": 458.72836, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "section_header", "bbox": { "l": 50.112, "t": 491.39536, "r": 163.7558, "b": 501.24741, "coord_origin": "TOPLEFT" }, "confidence": 0.9561247229576111, "cells": [ { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 501.24741, "r_x1": 64.448898, "r_y1": 501.24741, "r_x2": 64.448898, "r_y2": 491.39536, "r_x3": 50.112, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.006828, "r_y0": 501.24741, "r_x1": 163.7558, "r_y1": 501.24741, "r_x2": 163.7558, "r_y2": 491.39536, "r_x3": 74.006828, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 536.87337, "r": 286.36511, "b": 713.1519470000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9852361679077148, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 545.77992, "r_x1": 286.36499, "r_y1": 545.77992, "r_x2": 286.36499, "r_y2": 536.87337, "r_x3": 62.067001, "r_y3": 536.87337, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 557.73492, "r_x1": 211.15741, "r_y1": 557.73492, "r_x2": 211.15741, "r_y2": 548.82837, "r_x3": 50.112, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.10000999999997, "r_y0": 557.50578, "r_x1": 259.17453, "r_y1": 557.50578, "r_x2": 259.17453, "r_y2": 548.91803, "r_x3": 215.10000999999997, "r_y3": 548.91803, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73492, "r_x1": 286.36273, "r_y1": 557.73492, "r_x2": 286.36273, "r_y2": 548.82837, "r_x3": 263.12, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 569.68993, "r_x1": 286.36505, "r_y1": 569.68993, "r_x2": 286.36505, "r_y2": 560.78337, "r_x3": 50.112, "r_y3": 560.78337, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 581.6449299999999, "r_x1": 286.36508, "r_y1": 581.6449299999999, "r_x2": 286.36508, "r_y2": 572.73837, "r_x3": 50.112, "r_y3": 572.73837, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 593.59993, "r_x1": 286.36508, "r_y1": 593.59993, "r_x2": 286.36508, "r_y2": 584.69337, "r_x3": 50.112, "r_y3": 584.69337, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 605.55592, "r_x1": 286.36505, "r_y1": 605.55592, "r_x2": 286.36505, "r_y2": 596.64937, "r_x3": 50.112, "r_y3": 596.64937, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 617.51093, "r_x1": 286.36508, "r_y1": 617.51093, "r_x2": 286.36508, "r_y2": 608.60437, "r_x3": 50.112, "r_y3": 608.60437, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 629.46593, "r_x1": 286.36508, "r_y1": 629.46593, "r_x2": 286.36508, "r_y2": 620.55937, "r_x3": 50.112, "r_y3": 620.55937, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 641.42093, "r_x1": 286.36508, "r_y1": 641.42093, "r_x2": 286.36508, "r_y2": 632.51437, "r_x3": 50.112, "r_y3": 632.51437, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 653.37593, "r_x1": 286.36508, "r_y1": 653.37593, "r_x2": 286.36508, "r_y2": 644.46938, "r_x3": 50.112, "r_y3": 644.46938, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 665.33094, "r_x1": 286.36511, "r_y1": 665.33094, "r_x2": 286.36511, "r_y2": 656.42438, "r_x3": 50.112, "r_y3": 656.42438, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 677.28694, "r_x1": 286.36508, "r_y1": 677.28694, "r_x2": 286.36508, "r_y2": 668.38037, "r_x3": 50.112, "r_y3": 668.38037, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 689.24194, "r_x1": 286.36511, "r_y1": 689.24194, "r_x2": 286.36511, "r_y2": 680.33537, "r_x3": 50.112, "r_y3": 680.33537, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 701.196945, "r_x1": 286.36511, "r_y1": 701.196945, "r_x2": 286.36511, "r_y2": 692.290375, "r_x3": 50.112, "r_y3": 692.290375, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.1519470000001, "r_x1": 226.88833999999997, "r_y1": 713.1519470000001, "r_x2": 226.88833999999997, "r_y2": 704.245377, "r_x3": 50.112, "r_y3": 704.245377, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 308.862, "t": 490.70892, "r": 460.84848, "b": 501.45663, "coord_origin": "TOPLEFT" }, "confidence": 0.9436525702476501, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 501.45663, "r_x1": 316.07382, "r_y1": 501.45663, "r_x2": 316.07382, "r_y2": 490.70892, "r_x3": 308.862, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.68954, "r_y0": 501.45663, "r_x1": 460.84848, "r_y1": 501.45663, "r_x2": 460.84848, "r_y2": 490.70892, "r_x3": 325.68954, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 512.89337, "r": 545.11517, "b": 653.30592, "coord_origin": "TOPLEFT" }, "confidence": 0.9875594973564148, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 521.79993, "r_x1": 545.11505, "r_y1": 521.79993, "r_x2": 545.11505, "r_y2": 512.89337, "r_x3": 320.81699, "r_y3": 512.89337, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.75491, "r_x1": 545.11517, "r_y1": 533.75491, "r_x2": 545.11517, "r_y2": 524.84836, "r_x3": 308.862, "r_y3": 524.84836, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.70992, "r_x1": 545.11511, "r_y1": 545.70992, "r_x2": 545.11511, "r_y2": 536.80336, "r_x3": 308.862, "r_y3": 536.80336, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.6649199999999, "r_x1": 545.11505, "r_y1": 557.6649199999999, "r_x2": 545.11505, "r_y2": 548.75836, "r_x3": 308.862, "r_y3": 548.75836, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.61992, "r_x1": 545.11517, "r_y1": 569.61992, "r_x2": 545.11517, "r_y2": 560.71336, "r_x3": 308.862, "r_y3": 560.71336, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.57492, "r_x1": 545.11511, "r_y1": 581.57492, "r_x2": 545.11511, "r_y2": 572.66837, "r_x3": 308.862, "r_y3": 572.66837, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.53091, "r_x1": 545.11511, "r_y1": 593.53091, "r_x2": 545.11511, "r_y2": 584.62436, "r_x3": 308.862, "r_y3": 584.62436, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.48592, "r_x1": 400.46808, "r_y1": 605.48592, "r_x2": 400.46808, "r_y2": 596.57936, "r_x3": 308.862, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.37839, "r_y0": 605.48592, "r_x1": 545.11511, "r_y1": 605.48592, "r_x2": 545.11511, "r_y2": 596.57936, "r_x3": 408.37839, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.44092, "r_x1": 545.11505, "r_y1": 617.44092, "r_x2": 545.11505, "r_y2": 608.53436, "r_x3": 308.862, "r_y3": 608.53436, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.3959199999999, "r_x1": 545.11511, "r_y1": 629.3959199999999, "r_x2": 545.11511, "r_y2": 620.48936, "r_x3": 308.862, "r_y3": 620.48936, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.35092, "r_x1": 545.11505, "r_y1": 641.35092, "r_x2": 545.11505, "r_y2": 632.4443699999999, "r_x3": 308.862, "r_y3": 632.4443699999999, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.30592, "r_x1": 365.85803, "r_y1": 653.30592, "r_x2": 365.85803, "r_y2": 644.39937, "r_x3": 308.862, "r_y3": 644.39937, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 308.862, "t": 672.09892, "r": 364.40585, "b": 682.84664, "coord_origin": "TOPLEFT" }, "confidence": 0.9442470073699951, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 682.84664, "r_x1": 364.40585, "r_y1": 682.84664, "r_x2": 364.40585, "r_y2": 672.09892, "r_x3": 308.862, "r_y3": 672.09892, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 313.345, "t": 693.9617920000001, "r": 545.1134, "b": 712.936752, "coord_origin": "TOPLEFT" }, "confidence": 0.8318753838539124, "cells": [ { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.345, "r_y0": 701.977753, "r_x1": 323.80792, "r_y1": 701.977753, "r_x2": 323.80792, "r_y2": 693.9617920000001, "r_x3": 313.345, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05127, "r_y0": 701.977753, "r_x1": 545.10852, "r_y1": 701.977753, "r_x2": 545.10852, "r_y2": 693.9617920000001, "r_x3": 326.05127, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 712.936752, "r_x1": 545.1134, "r_y1": 712.936752, "r_x2": 545.1134, "r_y2": 704.920792, "r_x3": 328.78101, "r_y3": 704.920792, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133366, "r": 300.10229, "b": 743.039928, "coord_origin": "TOPLEFT" }, "confidence": 0.8709858059883118, "cells": [ { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "picture", "bbox": { "l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT" }, "confidence": 0.7699173092842102, "cells": [], "children": [] }, { "id": 14, "label": "picture", "bbox": { "l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT" }, "confidence": 0.7873926162719727, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "8": { "label": "table", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "table", "bbox": { "l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT" }, "confidence": 0.8824009299278259, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93285, "t": 222.18073000000004, "r": 241.04458999999997, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76489, "t": 222.18073000000004, "r": 284.50589, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.24990999999999, "t": 229.66594999999995, "r": 120.62018, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.36609, "t": 229.66594999999995, "r": 196.1071, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.10756, "t": 229.66594999999995, "r": 201.29247, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62408, "t": 229.66594999999995, "r": 219.99435, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.19814, "t": 229.66594999999995, "r": 244.75377, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.1142, "t": 229.66594999999995, "r": 266.48447, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38434, "t": 229.66594999999995, "r": 293.93997, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53052099999999, "t": 236.42584, "r": 162.7131, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.39731, "t": 236.42584, "r": 189.56456, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99026, "t": 236.42584, "r": 214.15752, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.87517, "t": 236.42584, "r": 237.45833000000002, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88446, "t": 236.42584, "r": 264.6358, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06134, "t": 236.42584, "r": 286.6445, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53052099999999, "t": 242.62048000000004, "r": 139.72253, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.10536, "t": 242.62048000000004, "r": 190.8567, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.69832, "t": 242.62048000000004, "r": 215.44965999999997, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.87517, "t": 242.62048000000004, "r": 237.45833000000002, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88446, "t": 242.62048000000004, "r": 264.6358, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06134, "t": 242.62048000000004, "r": 286.6445, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53052099999999, "t": 249.79845999999998, "r": 97.013, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.698288, "t": 249.58942000000002, "r": 103.03371, "b": 253.94732999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03389, "t": 249.79845999999998, "r": 128.96027, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.10536, "t": 248.81506000000002, "r": 190.8567, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28223, "t": 248.81506000000002, "r": 212.86539, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29153, "t": 248.81506000000002, "r": 240.04287999999997, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88446, "t": 248.81506000000002, "r": 264.6358, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.47742, "t": 248.81506000000002, "r": 289.22876, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53052099999999, "t": 257.28369, "r": 91.827637, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.052673, "t": 257.07465, "r": 93.219925, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.220474, "t": 257.28369, "r": 119.14685, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45073999999998, "t": 257.07465, "r": 129.88177, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.10536, "t": 256.30029, "r": 190.8567, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28223, "t": 256.30029, "r": 212.86539, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29153, "t": 256.30029, "r": 240.04287999999997, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88446, "t": 256.30029, "r": 264.6358, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.47742, "t": 256.30029, "r": 289.22876, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53052099999999, "t": 264.5108, "r": 60.715424, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.17654799999999, "t": 264.30175999999994, "r": 65.343796, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.344376, "t": 264.5108, "r": 122.38297000000001, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45073999999998, "t": 264.30175999999994, "r": 129.88177, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.10536, "t": 263.52739999999994, "r": 190.8567, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28223, "t": 263.52739999999994, "r": 212.86539, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29153, "t": 263.52739999999994, "r": 240.04287999999997, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88446, "t": 263.52739999999994, "r": 264.6358, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.47742, "t": 263.52739999999994, "r": 289.22876, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53052099999999, "t": 271.73785, "r": 107.38374, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99034, "t": 271.52881, "r": 109.74168000000002, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74204, "t": 271.73785, "r": 114.92695000000002, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.38793, "t": 271.52881, "r": 122.13927, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.13963, "t": 271.73785, "r": 127.32454000000001, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.39731, "t": 270.75446, "r": 189.56456, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28223, "t": 270.75446, "r": 212.86539, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58348, "t": 270.75446, "r": 238.75072999999998, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88446, "t": 270.75446, "r": 264.6358, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.47742, "t": 270.75446, "r": 289.22876, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53052099999999, "t": 279.01392, "r": 68.68605, "b": 283.37183, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.685814, "t": 279.22295999999994, "r": 110.16829999999999, "b": 283.40436, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.10536, "t": 277.98157000000003, "r": 190.8567, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99026, "t": 277.98157000000003, "r": 214.15752, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58348, "t": 277.98157000000003, "r": 238.75072999999998, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88446, "t": 277.98157000000003, "r": 264.6358, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.76938, "t": 277.98157000000003, "r": 287.93661, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.61508, "t": 286.45004, "r": 174.79999, "b": 290.63141, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.10536, "t": 285.46667, "r": 190.8567, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.69832, "t": 285.46667, "r": 215.44965999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29153, "t": 285.46667, "r": 240.04287999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.76506, "t": 285.46667, "r": 265.75204, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.47742, "t": 285.46667, "r": 289.22876, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 10, "num_cols": 6, "table_cells": [ { "bbox": { "l": 209.93285, "t": 222.18073000000004, "r": 241.04458999999997, "b": 226.36212, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 263.76489, "t": 222.18073000000004, "r": 284.50589, "b": 226.36212, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 110.24990999999999, "t": 229.66594999999995, "r": 120.62018, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 175.36609, "t": 229.66594999999995, "r": 196.1071, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb \u6570", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 209.62408, "t": 229.66594999999995, "r": 219.99435, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 229.19814, "t": 229.66594999999995, "r": 244.75377, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 256.1142, "t": 229.66594999999995, "r": 266.48447, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 278.38434, "t": 229.66594999999995, "r": 293.93997, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 236.42584, "r": 162.7131, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.39731, "t": 236.42584, "r": 189.56456, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99026, "t": 236.42584, "r": 214.15752, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.87517, "t": 236.42584, "r": 237.45833000000002, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 236.42584, "r": 264.6358, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06134, "t": 236.42584, "r": 286.6445, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 242.62048000000004, "r": 139.72253, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 242.62048000000004, "r": 190.8567, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.69832, "t": 242.62048000000004, "r": 215.44965999999997, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.87517, "t": 242.62048000000004, "r": 237.45833000000002, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 242.62048000000004, "r": 264.6358, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06134, "t": 242.62048000000004, "r": 286.6445, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 249.79845999999998, "r": 97.013, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 248.81506000000002, "r": 190.8567, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 248.81506000000002, "r": 212.86539, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 248.81506000000002, "r": 240.04287999999997, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 248.81506000000002, "r": 264.6358, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 248.81506000000002, "r": 289.22876, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 257.28369, "r": 91.827637, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 256.30029, "r": 190.8567, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 256.30029, "r": 212.86539, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 256.30029, "r": 240.04287999999997, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 256.30029, "r": 264.6358, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 256.30029, "r": 289.22876, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 264.5108, "r": 60.715424, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 263.52739999999994, "r": 190.8567, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 263.52739999999994, "r": 212.86539, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 263.52739999999994, "r": 240.04287999999997, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 263.52739999999994, "r": 264.6358, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 263.52739999999994, "r": 289.22876, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 271.73785, "r": 107.38374, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.39731, "t": 270.75446, "r": 189.56456, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 270.75446, "r": 212.86539, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58348, "t": 270.75446, "r": 238.75072999999998, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 270.75446, "r": 264.6358, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 270.75446, "r": 289.22876, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 279.01392, "r": 68.68605, "b": 283.37183, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 277.98157000000003, "r": 190.8567, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99026, "t": 277.98157000000003, "r": 214.15752, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58348, "t": 277.98157000000003, "r": 238.75072999999998, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 277.98157000000003, "r": 264.6358, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 282.76938, "t": 277.98157000000003, "r": 287.93661, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 169.61508, "t": 286.45004, "r": 174.79999, "b": 290.63141, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 285.46667, "r": 190.8567, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.69832, "t": 285.46667, "r": 215.44965999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 285.46667, "r": 240.04287999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 255.76506, "t": 285.46667, "r": 265.75204, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 285.46667, "r": 289.22876, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false } ] }, "7": { "label": "table", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "table", "bbox": { "l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8899767994880676, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.04861, "t": 221.62415, "r": 542.00018, "b": 226.68933000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82193, "t": 227.83416999999997, "r": 507.2258, "b": 232.89935000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.2442, "t": 236.74712999999997, "r": 400.74588, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.74643, "t": 236.74712999999997, "r": 404.64523, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.6463, "t": 236.74712999999997, "r": 407.34631, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.09671, "t": 221.57446000000004, "r": 438.0145, "b": 226.63964999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18323, "t": 236.74712999999997, "r": 440.98778999999996, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38254, "t": 236.74712999999997, "r": 482.48465000000004, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.92578, "t": 236.74712999999997, "r": 530.73035, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11493, "t": 244.61084000000005, "r": 355.6532, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65427, "t": 244.61084000000005, "r": 364.65607, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.24661, "t": 244.91327, "r": 400.75238, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.7529, "t": 244.91327, "r": 403.75531, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.81838999999997, "t": 244.91327, "r": 437.32708999999994, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.52859, "t": 244.91327, "r": 478.40103, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.97552, "t": 244.91327, "r": 483.55001999999996, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.44824, "t": 244.91327, "r": 531.46967, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11493, "t": 253.68451000000005, "r": 325.62674, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.24661, "t": 253.68451000000005, "r": 400.75238, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.7529, "t": 253.68451000000005, "r": 403.75531, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.81838999999997, "t": 253.68451000000005, "r": 437.32708999999994, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.43579000000005, "t": 253.68451000000005, "r": 482.54831, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29065, "t": 253.68451000000005, "r": 530.80981, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11493, "t": 261.54822, "r": 322.62866, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43222, "t": 261.54822, "r": 400.73563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73456, "t": 261.54822, "r": 403.73697, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.73804, "t": 261.54822, "r": 405.53625, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7016, "t": 261.54822, "r": 438.80563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.55533, "t": 261.54822, "r": 482.07043, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.01862, "t": 261.54822, "r": 529.53375, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11493, "t": 269.64148, "r": 356.24771, "b": 274.70667000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43222, "t": 270.31946000000005, "r": 400.73563, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73456, "t": 270.31946000000005, "r": 403.73697, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.73804, "t": 270.31946000000005, "r": 405.53625, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.02802, "t": 270.31946000000005, "r": 436.4280099999999, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83099000000004, "t": 270.31946000000005, "r": 482.35013, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.01862, "t": 270.31946000000005, "r": 529.53375, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11493, "t": 278.48572, "r": 373.35764, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.24661, "t": 278.48572, "r": 403.75531, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.51599, "t": 278.48572, "r": 437.02469, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.7142, "t": 278.48572, "r": 484.73965000000004, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99463, "t": 278.48572, "r": 534.02008, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 459.04861, "t": 221.62415, "r": 542.00018, "b": 226.68933000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 393.2442, "t": 236.74712999999997, "r": 400.74588, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RS U s", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 392.09671, "t": 221.57446000000004, "r": 438.0145, "b": 226.63964999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.18323, "t": 236.74712999999997, "r": 440.98778999999996, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 468.38254, "t": 236.74712999999997, "r": 482.48465000000004, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 516.92578, "t": 236.74712999999997, "r": 530.73035, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 244.61084000000005, "r": 355.6532, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on Janua ry 1", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 244.91327, "r": 400.75238, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1. 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.81838999999997, "t": 244.91327, "r": 437.32708999999994, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.52859, "t": 244.91327, "r": 478.40103, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.44824, "t": 244.91327, "r": 531.46967, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 253.68451000000005, "r": 325.62674, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 253.68451000000005, "r": 400.75238, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0. 5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.81838999999997, "t": 253.68451000000005, "r": 437.32708999999994, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 466.43579000000005, "t": 253.68451000000005, "r": 482.54831, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 514.29065, "t": 253.68451000000005, "r": 530.80981, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 261.54822, "r": 322.62866, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43222, "t": 261.54822, "r": 400.73563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 5 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 427.7016, "t": 261.54822, "r": 438.80563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 468.55533, "t": 261.54822, "r": 482.07043, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.01862, "t": 261.54822, "r": 529.53375, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 269.64148, "r": 356.24771, "b": 274.70667000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43222, "t": 270.31946000000005, "r": 400.73563, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 1 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 431.02802, "t": 270.31946000000005, "r": 436.4280099999999, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.83099000000004, "t": 270.31946000000005, "r": 482.35013, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.01862, "t": 270.31946000000005, "r": 529.53375, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 278.48572, "r": 373.35764, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 278.48572, "r": 403.75531, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.51599, "t": 278.48572, "r": 437.02469, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 463.7142, "t": 278.48572, "r": 484.73965000000004, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.99463, "t": 278.48572, "r": 534.02008, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 18, "page_no": 7, "cluster": { "id": 18, "label": "caption", "bbox": { "l": 53.811783000000005, "t": 208.23328000000004, "r": 385.93451, "b": 216.10645, "coord_origin": "TOPLEFT" }, "confidence": 0.5986505746841431, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 216.10645, "r_x1": 62.219952, "r_y1": 216.10645, "r_x2": 62.219952, "r_y2": 208.23328000000004, "r_x3": 53.811783000000005, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.424026, "r_y0": 216.10645, "r_x1": 385.93451, "r_y1": 216.10645, "r_x2": 385.93451, "r_y2": 208.23328000000004, "r_x3": 66.424026, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:" }, { "label": "section_header", "id": 29, "page_no": 7, "cluster": { "id": 29, "label": "section_header", "bbox": { "l": 53.811783000000005, "t": 94.28112999999996, "r": 284.34592, "b": 102.15430000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.46452972292900085, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 102.15430000000003, "r_x1": 284.34592, "r_y1": 102.15430000000003, "r_x2": 284.34592, "r_y2": 94.28112999999996, "r_x3": 53.811783000000005, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Japanese language (previously unseen by TableFormer):" }, { "label": "section_header", "id": 31, "page_no": 7, "cluster": { "id": 31, "label": "section_header", "bbox": { "l": 304.83081, "t": 94.28112999999996, "r": 431.09119, "b": 102.15430000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.4629225730895996, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83081, "r_y0": 102.15430000000003, "r_x1": 431.09119, "r_y1": 102.15430000000003, "r_x2": 431.09119, "r_y2": 94.28112999999996, "r_x3": 304.83081, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Example table from FinTabNet:" }, { "label": "list_item", "id": 20, "page_no": 7, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 53.286037, "t": 78.68756000000008, "r": 61.550289, "b": 86.56073000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.5820134282112122, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.286037, "r_y0": 86.56073000000004, "r_x1": 61.550289, "r_y1": 86.56073000000004, "r_x2": 61.550289, "r_y2": 78.68756000000008, "r_x3": 53.286037, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a." }, { "label": "list_item", "id": 21, "page_no": 7, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 65.682419, "t": 78.68756000000008, "r": 499.55563, "b": 86.56073000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.541211724281311, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.682419, "r_y0": 86.56073000000004, "r_x1": 499.55563, "r_y1": 86.56073000000004, "r_x2": 499.55563, "r_y2": 78.68756000000008, "r_x3": 65.682419, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells" }, { "label": "table", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "table", "bbox": { "l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT" }, "confidence": 0.8824009299278259, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93285, "t": 222.18073000000004, "r": 241.04458999999997, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76489, "t": 222.18073000000004, "r": 284.50589, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.24990999999999, "t": 229.66594999999995, "r": 120.62018, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.36609, "t": 229.66594999999995, "r": 196.1071, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.10756, "t": 229.66594999999995, "r": 201.29247, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62408, "t": 229.66594999999995, "r": 219.99435, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.19814, "t": 229.66594999999995, "r": 244.75377, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.1142, "t": 229.66594999999995, "r": 266.48447, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38434, "t": 229.66594999999995, "r": 293.93997, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53052099999999, "t": 236.42584, "r": 162.7131, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.39731, "t": 236.42584, "r": 189.56456, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99026, "t": 236.42584, "r": 214.15752, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.87517, "t": 236.42584, "r": 237.45833000000002, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88446, "t": 236.42584, "r": 264.6358, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06134, "t": 236.42584, "r": 286.6445, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53052099999999, "t": 242.62048000000004, "r": 139.72253, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.10536, "t": 242.62048000000004, "r": 190.8567, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.69832, "t": 242.62048000000004, "r": 215.44965999999997, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.87517, "t": 242.62048000000004, "r": 237.45833000000002, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88446, "t": 242.62048000000004, "r": 264.6358, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06134, "t": 242.62048000000004, "r": 286.6445, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53052099999999, "t": 249.79845999999998, "r": 97.013, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.698288, "t": 249.58942000000002, "r": 103.03371, "b": 253.94732999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03389, "t": 249.79845999999998, "r": 128.96027, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.10536, "t": 248.81506000000002, "r": 190.8567, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28223, "t": 248.81506000000002, "r": 212.86539, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29153, "t": 248.81506000000002, "r": 240.04287999999997, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88446, "t": 248.81506000000002, "r": 264.6358, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.47742, "t": 248.81506000000002, "r": 289.22876, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53052099999999, "t": 257.28369, "r": 91.827637, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.052673, "t": 257.07465, "r": 93.219925, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.220474, "t": 257.28369, "r": 119.14685, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45073999999998, "t": 257.07465, "r": 129.88177, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.10536, "t": 256.30029, "r": 190.8567, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28223, "t": 256.30029, "r": 212.86539, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29153, "t": 256.30029, "r": 240.04287999999997, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88446, "t": 256.30029, "r": 264.6358, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.47742, "t": 256.30029, "r": 289.22876, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53052099999999, "t": 264.5108, "r": 60.715424, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.17654799999999, "t": 264.30175999999994, "r": 65.343796, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.344376, "t": 264.5108, "r": 122.38297000000001, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45073999999998, "t": 264.30175999999994, "r": 129.88177, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.10536, "t": 263.52739999999994, "r": 190.8567, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28223, "t": 263.52739999999994, "r": 212.86539, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29153, "t": 263.52739999999994, "r": 240.04287999999997, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88446, "t": 263.52739999999994, "r": 264.6358, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.47742, "t": 263.52739999999994, "r": 289.22876, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53052099999999, "t": 271.73785, "r": 107.38374, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99034, "t": 271.52881, "r": 109.74168000000002, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74204, "t": 271.73785, "r": 114.92695000000002, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.38793, "t": 271.52881, "r": 122.13927, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.13963, "t": 271.73785, "r": 127.32454000000001, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.39731, "t": 270.75446, "r": 189.56456, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28223, "t": 270.75446, "r": 212.86539, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58348, "t": 270.75446, "r": 238.75072999999998, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88446, "t": 270.75446, "r": 264.6358, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.47742, "t": 270.75446, "r": 289.22876, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53052099999999, "t": 279.01392, "r": 68.68605, "b": 283.37183, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.685814, "t": 279.22295999999994, "r": 110.16829999999999, "b": 283.40436, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.10536, "t": 277.98157000000003, "r": 190.8567, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99026, "t": 277.98157000000003, "r": 214.15752, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58348, "t": 277.98157000000003, "r": 238.75072999999998, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88446, "t": 277.98157000000003, "r": 264.6358, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.76938, "t": 277.98157000000003, "r": 287.93661, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.61508, "t": 286.45004, "r": 174.79999, "b": 290.63141, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.10536, "t": 285.46667, "r": 190.8567, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.69832, "t": 285.46667, "r": 215.44965999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29153, "t": 285.46667, "r": 240.04287999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.76506, "t": 285.46667, "r": 265.75204, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.47742, "t": 285.46667, "r": 289.22876, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 10, "num_cols": 6, "table_cells": [ { "bbox": { "l": 209.93285, "t": 222.18073000000004, "r": 241.04458999999997, "b": 226.36212, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 263.76489, "t": 222.18073000000004, "r": 284.50589, "b": 226.36212, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 110.24990999999999, "t": 229.66594999999995, "r": 120.62018, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 175.36609, "t": 229.66594999999995, "r": 196.1071, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb \u6570", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 209.62408, "t": 229.66594999999995, "r": 219.99435, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 229.19814, "t": 229.66594999999995, "r": 244.75377, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 256.1142, "t": 229.66594999999995, "r": 266.48447, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 278.38434, "t": 229.66594999999995, "r": 293.93997, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 236.42584, "r": 162.7131, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.39731, "t": 236.42584, "r": 189.56456, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99026, "t": 236.42584, "r": 214.15752, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.87517, "t": 236.42584, "r": 237.45833000000002, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 236.42584, "r": 264.6358, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06134, "t": 236.42584, "r": 286.6445, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 242.62048000000004, "r": 139.72253, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 242.62048000000004, "r": 190.8567, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.69832, "t": 242.62048000000004, "r": 215.44965999999997, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.87517, "t": 242.62048000000004, "r": 237.45833000000002, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 242.62048000000004, "r": 264.6358, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06134, "t": 242.62048000000004, "r": 286.6445, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 249.79845999999998, "r": 97.013, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 248.81506000000002, "r": 190.8567, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 248.81506000000002, "r": 212.86539, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 248.81506000000002, "r": 240.04287999999997, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 248.81506000000002, "r": 264.6358, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 248.81506000000002, "r": 289.22876, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 257.28369, "r": 91.827637, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 256.30029, "r": 190.8567, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 256.30029, "r": 212.86539, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 256.30029, "r": 240.04287999999997, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 256.30029, "r": 264.6358, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 256.30029, "r": 289.22876, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 264.5108, "r": 60.715424, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 263.52739999999994, "r": 190.8567, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 263.52739999999994, "r": 212.86539, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 263.52739999999994, "r": 240.04287999999997, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 263.52739999999994, "r": 264.6358, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 263.52739999999994, "r": 289.22876, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 271.73785, "r": 107.38374, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.39731, "t": 270.75446, "r": 189.56456, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 270.75446, "r": 212.86539, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58348, "t": 270.75446, "r": 238.75072999999998, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 270.75446, "r": 264.6358, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 270.75446, "r": 289.22876, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 279.01392, "r": 68.68605, "b": 283.37183, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 277.98157000000003, "r": 190.8567, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99026, "t": 277.98157000000003, "r": 214.15752, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58348, "t": 277.98157000000003, "r": 238.75072999999998, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 277.98157000000003, "r": 264.6358, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 282.76938, "t": 277.98157000000003, "r": 287.93661, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 169.61508, "t": 286.45004, "r": 174.79999, "b": 290.63141, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 285.46667, "r": 190.8567, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.69832, "t": 285.46667, "r": 215.44965999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 285.46667, "r": 240.04287999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 255.76506, "t": 285.46667, "r": 265.75204, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 285.46667, "r": 289.22876, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 16, "page_no": 7, "cluster": { "id": 16, "label": "caption", "bbox": { "l": 380.42731, "t": 292.30426, "r": 549.42175, "b": 298.60284, "coord_origin": "TOPLEFT" }, "confidence": 0.7499915957450867, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.42731, "r_y0": 298.60284, "r_x1": 549.42175, "r_y1": 298.60284, "r_x2": 549.42175, "r_y2": 292.30426, "r_x3": 380.42731, "r_y3": 292.30426, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Text is aligned to match original for ease of viewing" }, { "label": "table", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "table", "bbox": { "l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8899767994880676, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.04861, "t": 221.62415, "r": 542.00018, "b": 226.68933000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82193, "t": 227.83416999999997, "r": 507.2258, "b": 232.89935000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.2442, "t": 236.74712999999997, "r": 400.74588, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.74643, "t": 236.74712999999997, "r": 404.64523, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.6463, "t": 236.74712999999997, "r": 407.34631, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.09671, "t": 221.57446000000004, "r": 438.0145, "b": 226.63964999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18323, "t": 236.74712999999997, "r": 440.98778999999996, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38254, "t": 236.74712999999997, "r": 482.48465000000004, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.92578, "t": 236.74712999999997, "r": 530.73035, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11493, "t": 244.61084000000005, "r": 355.6532, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65427, "t": 244.61084000000005, "r": 364.65607, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.24661, "t": 244.91327, "r": 400.75238, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.7529, "t": 244.91327, "r": 403.75531, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.81838999999997, "t": 244.91327, "r": 437.32708999999994, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.52859, "t": 244.91327, "r": 478.40103, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.97552, "t": 244.91327, "r": 483.55001999999996, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.44824, "t": 244.91327, "r": 531.46967, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11493, "t": 253.68451000000005, "r": 325.62674, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.24661, "t": 253.68451000000005, "r": 400.75238, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.7529, "t": 253.68451000000005, "r": 403.75531, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.81838999999997, "t": 253.68451000000005, "r": 437.32708999999994, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.43579000000005, "t": 253.68451000000005, "r": 482.54831, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29065, "t": 253.68451000000005, "r": 530.80981, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11493, "t": 261.54822, "r": 322.62866, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43222, "t": 261.54822, "r": 400.73563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73456, "t": 261.54822, "r": 403.73697, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.73804, "t": 261.54822, "r": 405.53625, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7016, "t": 261.54822, "r": 438.80563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.55533, "t": 261.54822, "r": 482.07043, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.01862, "t": 261.54822, "r": 529.53375, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11493, "t": 269.64148, "r": 356.24771, "b": 274.70667000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43222, "t": 270.31946000000005, "r": 400.73563, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73456, "t": 270.31946000000005, "r": 403.73697, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.73804, "t": 270.31946000000005, "r": 405.53625, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.02802, "t": 270.31946000000005, "r": 436.4280099999999, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83099000000004, "t": 270.31946000000005, "r": 482.35013, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.01862, "t": 270.31946000000005, "r": 529.53375, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11493, "t": 278.48572, "r": 373.35764, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.24661, "t": 278.48572, "r": 403.75531, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.51599, "t": 278.48572, "r": 437.02469, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.7142, "t": 278.48572, "r": 484.73965000000004, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99463, "t": 278.48572, "r": 534.02008, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 459.04861, "t": 221.62415, "r": 542.00018, "b": 226.68933000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 393.2442, "t": 236.74712999999997, "r": 400.74588, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RS U s", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 392.09671, "t": 221.57446000000004, "r": 438.0145, "b": 226.63964999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.18323, "t": 236.74712999999997, "r": 440.98778999999996, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 468.38254, "t": 236.74712999999997, "r": 482.48465000000004, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 516.92578, "t": 236.74712999999997, "r": 530.73035, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 244.61084000000005, "r": 355.6532, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on Janua ry 1", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 244.91327, "r": 400.75238, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1. 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.81838999999997, "t": 244.91327, "r": 437.32708999999994, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.52859, "t": 244.91327, "r": 478.40103, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.44824, "t": 244.91327, "r": 531.46967, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 253.68451000000005, "r": 325.62674, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 253.68451000000005, "r": 400.75238, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0. 5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.81838999999997, "t": 253.68451000000005, "r": 437.32708999999994, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 466.43579000000005, "t": 253.68451000000005, "r": 482.54831, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 514.29065, "t": 253.68451000000005, "r": 530.80981, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 261.54822, "r": 322.62866, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43222, "t": 261.54822, "r": 400.73563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 5 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 427.7016, "t": 261.54822, "r": 438.80563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 468.55533, "t": 261.54822, "r": 482.07043, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.01862, "t": 261.54822, "r": 529.53375, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 269.64148, "r": 356.24771, "b": 274.70667000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43222, "t": 270.31946000000005, "r": 400.73563, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 1 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 431.02802, "t": 270.31946000000005, "r": 436.4280099999999, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.83099000000004, "t": 270.31946000000005, "r": 482.35013, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.01862, "t": 270.31946000000005, "r": 529.53375, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 278.48572, "r": 373.35764, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 278.48572, "r": 403.75531, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.51599, "t": 278.48572, "r": 437.02469, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 463.7142, "t": 278.48572, "r": 484.73965000000004, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.99463, "t": 278.48572, "r": 534.02008, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.112, "t": 320.87735, "r": 545.11377, "b": 365.64987, "coord_origin": "TOPLEFT" }, "confidence": 0.9140303134918213, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 329.78391, "r_x1": 86.864021, "r_y1": 329.78391, "r_x2": 86.864021, "r_y2": 320.87735, "r_x3": 50.112, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.917542, "r_y0": 329.78391, "r_x1": 545.11371, "r_y1": 329.78391, "r_x2": 545.11371, "r_y2": 320.87735, "r_x3": 93.917542, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 341.73889, "r_x1": 545.11371, "r_y1": 341.73889, "r_x2": 545.11371, "r_y2": 332.83233999999993, "r_x3": 50.112, "r_y3": 332.83233999999993, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 353.69388, "r_x1": 545.11377, "r_y1": 353.69388, "r_x2": 545.11377, "r_y2": 344.78732, "r_x3": 50.112, "r_y3": 344.78732, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.64987, "r_x1": 139.79532, "r_y1": 365.64987, "r_x2": 139.79532, "r_y2": 356.74332, "r_x3": 50.112, "r_y3": 356.74332, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset." }, { "label": "picture", "id": 12, "page_no": 7, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT" }, "confidence": 0.805853009223938, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26282, "r_y0": 386.44281, "r_x1": 342.07819, "r_y1": 386.44281, "r_x2": 342.07819, "r_y2": 381.77722, "r_x3": 220.26282, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 167, "label": "text", "bbox": { "l": 220.26282, "t": 381.77722, "r": 342.07819, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26282, "r_y0": 386.44281, "r_x1": 342.07819, "r_y1": 386.44281, "r_x2": 342.07819, "r_y2": 381.77722, "r_x3": 220.26282, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 11, "page_no": 7, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT" }, "confidence": 0.8308426737785339, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.715248, "r_y0": 386.44281, "r_x1": 85.657333, "r_y1": 386.44281, "r_x2": 85.657333, "r_y2": 381.77722, "r_x3": 53.715248, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 168, "label": "text", "bbox": { "l": 53.715248, "t": 381.77722, "r": 85.657333, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.715248, "r_y0": 386.44281, "r_x1": 85.657333, "r_y1": 386.44281, "r_x2": 85.657333, "r_y2": 381.77722, "r_x3": 53.715248, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 13, "page_no": 7, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT" }, "confidence": 0.7881615161895752, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 406.87158, "r_x1": 443.69870000000003, "r_y1": 406.87158, "r_x2": 443.69870000000003, "r_y2": 400.55295, "r_x3": 437.37939, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 406.87158, "r_x1": 456.6513100000001, "r_y1": 406.87158, "r_x2": 456.6513100000001, "r_y2": 400.55295, "r_x3": 450.33203, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 406.87158, "r_x1": 469.60394, "r_y1": 406.87158, "r_x2": 469.60394, "r_y2": 400.55295, "r_x3": 463.28464, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23724000000004, "r_y0": 406.87158, "r_x1": 482.5565500000001, "r_y1": 406.87158, "r_x2": 482.5565500000001, "r_y2": 400.55295, "r_x3": 476.23724000000004, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18988, "r_y0": 406.87158, "r_x1": 495.50916, "r_y1": 406.87158, "r_x2": 495.50916, "r_y2": 400.55295, "r_x3": 489.18988, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14251999999993, "r_y0": 406.87158, "r_x1": 508.46178999999995, "r_y1": 406.87158, "r_x2": 508.46178999999995, "r_y2": 400.55295, "r_x3": 502.14251999999993, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09509, "r_y0": 406.87158, "r_x1": 521.41443, "r_y1": 406.87158, "r_x2": 521.41443, "r_y2": 400.55295, "r_x3": 515.09509, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 417.35699, "r_x1": 391.60071, "r_y1": 417.35699, "r_x2": 391.60071, "r_y2": 411.03836000000007, "r_x3": 385.2814, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 417.35699, "r_x1": 404.84271, "r_y1": 417.35699, "r_x2": 404.84271, "r_y2": 411.03836000000007, "r_x3": 398.52341, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 417.35699, "r_x1": 417.79535, "r_y1": 417.35699, "r_x2": 417.79535, "r_y2": 411.03836000000007, "r_x3": 411.47604, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 417.35699, "r_x1": 443.69870000000003, "r_y1": 417.35699, "r_x2": 443.69870000000003, "r_y2": 411.03836000000007, "r_x3": 437.37939, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 417.35699, "r_x1": 456.6513100000001, "r_y1": 417.35699, "r_x2": 456.6513100000001, "r_y2": 411.03836000000007, "r_x3": 450.33203, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 417.35699, "r_x1": 469.60394, "r_y1": 417.35699, "r_x2": 469.60394, "r_y2": 411.03836000000007, "r_x3": 463.28464, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 427.38834, "r_x1": 391.60071, "r_y1": 427.38834, "r_x2": 391.60071, "r_y2": 421.0697, "r_x3": 385.2814, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 427.38834, "r_x1": 404.84271, "r_y1": 427.38834, "r_x2": 404.84271, "r_y2": 421.0697, "r_x3": 398.52341, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 427.38834, "r_x1": 417.79532, "r_y1": 427.38834, "r_x2": 417.79532, "r_y2": 421.0697, "r_x3": 411.47604, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 427.38834, "r_x1": 430.74796, "r_y1": 427.38834, "r_x2": 430.74796, "r_y2": 421.0697, "r_x3": 424.42865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 427.38834, "r_x1": 443.70056, "r_y1": 427.38834, "r_x2": 443.70056, "r_y2": 421.0697, "r_x3": 437.38129, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 427.38834, "r_x1": 456.65319999999997, "r_y1": 427.38834, "r_x2": 456.65319999999997, "r_y2": 421.0697, "r_x3": 450.33389000000005, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 427.38834, "r_x1": 469.6058, "r_y1": 427.38834, "r_x2": 469.6058, "r_y2": 421.0697, "r_x3": 463.2865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 427.38834, "r_x1": 482.55841, "r_y1": 427.38834, "r_x2": 482.55841, "r_y2": 421.0697, "r_x3": 476.23914, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 427.38834, "r_x1": 495.51105, "r_y1": 427.38834, "r_x2": 495.51105, "r_y2": 421.0697, "r_x3": 489.1917700000001, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 427.38834, "r_x1": 508.46368, "r_y1": 427.38834, "r_x2": 508.46368, "r_y2": 421.0697, "r_x3": 502.14438, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 427.38834, "r_x1": 521.41632, "r_y1": 427.38834, "r_x2": 521.41632, "r_y2": 421.0697, "r_x3": 515.09705, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 427.38834, "r_x1": 534.3689, "r_y1": 427.38834, "r_x2": 534.3689, "r_y2": 421.0697, "r_x3": 528.04962, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 438.36295, "r_x1": 391.60071, "r_y1": 438.36295, "r_x2": 391.60071, "r_y2": 432.04431, "r_x3": 385.2814, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 438.36295, "r_x1": 404.84271, "r_y1": 438.36295, "r_x2": 404.84271, "r_y2": 432.04431, "r_x3": 398.52341, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 438.36295, "r_x1": 417.79532, "r_y1": 438.36295, "r_x2": 417.79532, "r_y2": 432.04431, "r_x3": 411.47604, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 438.36295, "r_x1": 430.74796, "r_y1": 438.36295, "r_x2": 430.74796, "r_y2": 432.04431, "r_x3": 424.42865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 438.36295, "r_x1": 443.70056, "r_y1": 438.36295, "r_x2": 443.70056, "r_y2": 432.04431, "r_x3": 437.38129, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 438.36295, "r_x1": 456.65319999999997, "r_y1": 438.36295, "r_x2": 456.65319999999997, "r_y2": 432.04431, "r_x3": 450.33389000000005, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 438.36295, "r_x1": 469.6058, "r_y1": 438.36295, "r_x2": 469.6058, "r_y2": 432.04431, "r_x3": 463.2865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 438.36295, "r_x1": 482.55841, "r_y1": 438.36295, "r_x2": 482.55841, "r_y2": 432.04431, "r_x3": 476.23914, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 438.36295, "r_x1": 495.51105, "r_y1": 438.36295, "r_x2": 495.51105, "r_y2": 432.04431, "r_x3": 489.1917700000001, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 438.36295, "r_x1": 508.46368, "r_y1": 438.36295, "r_x2": 508.46368, "r_y2": 432.04431, "r_x3": 502.14438, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 438.36295, "r_x1": 521.41632, "r_y1": 438.36295, "r_x2": 521.41632, "r_y2": 432.04431, "r_x3": 515.09705, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 438.36295, "r_x1": 534.3689, "r_y1": 438.36295, "r_x2": 534.3689, "r_y2": 432.04431, "r_x3": 528.04962, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 395.51868, "r_x1": 388.44073, "r_y1": 395.51868, "r_x2": 388.44073, "r_y2": 389.20004, "r_x3": 385.2814, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 395.51868, "r_x1": 401.68274, "r_y1": 395.51868, "r_x2": 401.68274, "r_y2": 389.20004, "r_x3": 398.52341, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.4754, "r_y0": 395.51868, "r_x1": 414.63474, "r_y1": 395.51868, "r_x2": 414.63474, "r_y2": 389.20004, "r_x3": 411.4754, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.4274, "r_y0": 395.51868, "r_x1": 427.58673, "r_y1": 395.51868, "r_x2": 427.58673, "r_y2": 389.20004, "r_x3": 424.4274, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 395.51868, "r_x1": 440.53870000000006, "r_y1": 395.51868, "r_x2": 440.53870000000006, "r_y2": 389.20004, "r_x3": 437.37939, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33136, "r_y0": 395.51868, "r_x1": 453.49069000000003, "r_y1": 395.51868, "r_x2": 453.49069000000003, "r_y2": 389.20004, "r_x3": 450.33136, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28336, "r_y0": 395.51868, "r_x1": 466.44269, "r_y1": 395.51868, "r_x2": 466.44269, "r_y2": 389.20004, "r_x3": 463.28336, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23535, "r_y0": 395.51868, "r_x1": 479.39468, "r_y1": 395.51868, "r_x2": 479.39468, "r_y2": 389.20004, "r_x3": 476.23535, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18735, "r_y0": 395.51868, "r_x1": 492.34668, "r_y1": 395.51868, "r_x2": 492.34668, "r_y2": 389.20004, "r_x3": 489.18735, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.13933999999995, "r_y0": 395.51868, "r_x1": 505.29868000000005, "r_y1": 395.51868, "r_x2": 505.29868000000005, "r_y2": 389.20004, "r_x3": 502.13933999999995, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09131, "r_y0": 395.51868, "r_x1": 521.41064, "r_y1": 395.51868, "r_x2": 521.41064, "r_y2": 389.20004, "r_x3": 515.09131, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04364, "r_y0": 395.51868, "r_x1": 534.13104, "r_y1": 395.51868, "r_x2": 534.13104, "r_y2": 389.20004, "r_x3": 528.04364, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 405.29327, "r_x1": 391.60071, "r_y1": 405.29327, "r_x2": 391.60071, "r_y2": 398.97464, "r_x3": 385.2814, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 405.29327, "r_x1": 404.84271, "r_y1": 405.29327, "r_x2": 404.84271, "r_y2": 398.97464, "r_x3": 398.52341, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 405.29327, "r_x1": 417.79535, "r_y1": 405.29327, "r_x2": 417.79535, "r_y2": 398.97464, "r_x3": 411.47604, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42719, "r_y0": 413.09326, "r_x1": 430.74648999999994, "r_y1": 413.09326, "r_x2": 430.74648999999994, "r_y2": 406.77463000000006, "r_x3": 424.42719, "r_y3": 406.77463000000006, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.86941999999993, "r_y0": 417.31302, "r_x1": 509.18871999999993, "r_y1": 417.31302, "r_x2": 509.18871999999993, "r_y2": 410.99438, "r_x3": 502.86941999999993, "r_y3": 410.99438, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35437, "r_y0": 386.44281, "r_x1": 430.99261, "r_y1": 386.44281, "r_x2": 430.99261, "r_y2": 381.77722, "r_x3": 384.35437, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 169, "label": "text", "bbox": { "l": 437.37939, "t": 400.55295, "r": 443.69870000000003, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 406.87158, "r_x1": 443.69870000000003, "r_y1": 406.87158, "r_x2": 443.69870000000003, "r_y2": 400.55295, "r_x3": 437.37939, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 170, "label": "text", "bbox": { "l": 450.33203, "t": 400.55295, "r": 456.6513100000001, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 406.87158, "r_x1": 456.6513100000001, "r_y1": 406.87158, "r_x2": 456.6513100000001, "r_y2": 400.55295, "r_x3": 450.33203, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 171, "label": "text", "bbox": { "l": 463.28464, "t": 400.55295, "r": 469.60394, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 406.87158, "r_x1": 469.60394, "r_y1": 406.87158, "r_x2": 469.60394, "r_y2": 400.55295, "r_x3": 463.28464, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 172, "label": "text", "bbox": { "l": 476.23724000000004, "t": 400.55295, "r": 482.5565500000001, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23724000000004, "r_y0": 406.87158, "r_x1": 482.5565500000001, "r_y1": 406.87158, "r_x2": 482.5565500000001, "r_y2": 400.55295, "r_x3": 476.23724000000004, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 173, "label": "text", "bbox": { "l": 489.18988, "t": 400.55295, "r": 495.50916, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18988, "r_y0": 406.87158, "r_x1": 495.50916, "r_y1": 406.87158, "r_x2": 495.50916, "r_y2": 400.55295, "r_x3": 489.18988, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 174, "label": "text", "bbox": { "l": 502.14251999999993, "t": 400.55295, "r": 508.46178999999995, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14251999999993, "r_y0": 406.87158, "r_x1": 508.46178999999995, "r_y1": 406.87158, "r_x2": 508.46178999999995, "r_y2": 400.55295, "r_x3": 502.14251999999993, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 175, "label": "text", "bbox": { "l": 515.09509, "t": 400.55295, "r": 521.41443, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09509, "r_y0": 406.87158, "r_x1": 521.41443, "r_y1": 406.87158, "r_x2": 521.41443, "r_y2": 400.55295, "r_x3": 515.09509, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 176, "label": "text", "bbox": { "l": 385.2814, "t": 411.03836000000007, "r": 391.60071, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 417.35699, "r_x1": 391.60071, "r_y1": 417.35699, "r_x2": 391.60071, "r_y2": 411.03836000000007, "r_x3": 385.2814, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 177, "label": "text", "bbox": { "l": 398.52341, "t": 411.03836000000007, "r": 404.84271, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 417.35699, "r_x1": 404.84271, "r_y1": 417.35699, "r_x2": 404.84271, "r_y2": 411.03836000000007, "r_x3": 398.52341, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 178, "label": "text", "bbox": { "l": 411.47604, "t": 411.03836000000007, "r": 417.79535, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 417.35699, "r_x1": 417.79535, "r_y1": 417.35699, "r_x2": 417.79535, "r_y2": 411.03836000000007, "r_x3": 411.47604, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 179, "label": "text", "bbox": { "l": 437.37939, "t": 411.03836000000007, "r": 443.69870000000003, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 417.35699, "r_x1": 443.69870000000003, "r_y1": 417.35699, "r_x2": 443.69870000000003, "r_y2": 411.03836000000007, "r_x3": 437.37939, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 180, "label": "text", "bbox": { "l": 450.33203, "t": 411.03836000000007, "r": 456.6513100000001, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 417.35699, "r_x1": 456.6513100000001, "r_y1": 417.35699, "r_x2": 456.6513100000001, "r_y2": 411.03836000000007, "r_x3": 450.33203, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 181, "label": "text", "bbox": { "l": 463.28464, "t": 411.03836000000007, "r": 469.60394, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 417.35699, "r_x1": 469.60394, "r_y1": 417.35699, "r_x2": 469.60394, "r_y2": 411.03836000000007, "r_x3": 463.28464, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 182, "label": "text", "bbox": { "l": 385.2814, "t": 421.0697, "r": 391.60071, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 427.38834, "r_x1": 391.60071, "r_y1": 427.38834, "r_x2": 391.60071, "r_y2": 421.0697, "r_x3": 385.2814, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 183, "label": "text", "bbox": { "l": 398.52341, "t": 421.0697, "r": 404.84271, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 427.38834, "r_x1": 404.84271, "r_y1": 427.38834, "r_x2": 404.84271, "r_y2": 421.0697, "r_x3": 398.52341, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 184, "label": "text", "bbox": { "l": 411.47604, "t": 421.0697, "r": 417.79532, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 427.38834, "r_x1": 417.79532, "r_y1": 427.38834, "r_x2": 417.79532, "r_y2": 421.0697, "r_x3": 411.47604, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 185, "label": "text", "bbox": { "l": 424.42865, "t": 421.0697, "r": 430.74796, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 427.38834, "r_x1": 430.74796, "r_y1": 427.38834, "r_x2": 430.74796, "r_y2": 421.0697, "r_x3": 424.42865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 186, "label": "text", "bbox": { "l": 437.38129, "t": 421.0697, "r": 443.70056, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 427.38834, "r_x1": 443.70056, "r_y1": 427.38834, "r_x2": 443.70056, "r_y2": 421.0697, "r_x3": 437.38129, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 187, "label": "text", "bbox": { "l": 450.33389000000005, "t": 421.0697, "r": 456.65319999999997, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 427.38834, "r_x1": 456.65319999999997, "r_y1": 427.38834, "r_x2": 456.65319999999997, "r_y2": 421.0697, "r_x3": 450.33389000000005, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 188, "label": "text", "bbox": { "l": 463.2865, "t": 421.0697, "r": 469.6058, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 427.38834, "r_x1": 469.6058, "r_y1": 427.38834, "r_x2": 469.6058, "r_y2": 421.0697, "r_x3": 463.2865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 189, "label": "text", "bbox": { "l": 476.23914, "t": 421.0697, "r": 482.55841, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 427.38834, "r_x1": 482.55841, "r_y1": 427.38834, "r_x2": 482.55841, "r_y2": 421.0697, "r_x3": 476.23914, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 190, "label": "text", "bbox": { "l": 489.1917700000001, "t": 421.0697, "r": 495.51105, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 427.38834, "r_x1": 495.51105, "r_y1": 427.38834, "r_x2": 495.51105, "r_y2": 421.0697, "r_x3": 489.1917700000001, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 191, "label": "text", "bbox": { "l": 502.14438, "t": 421.0697, "r": 508.46368, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 427.38834, "r_x1": 508.46368, "r_y1": 427.38834, "r_x2": 508.46368, "r_y2": 421.0697, "r_x3": 502.14438, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 192, "label": "text", "bbox": { "l": 515.09705, "t": 421.0697, "r": 521.41632, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 427.38834, "r_x1": 521.41632, "r_y1": 427.38834, "r_x2": 521.41632, "r_y2": 421.0697, "r_x3": 515.09705, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 193, "label": "text", "bbox": { "l": 528.04962, "t": 421.0697, "r": 534.3689, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 427.38834, "r_x1": 534.3689, "r_y1": 427.38834, "r_x2": 534.3689, "r_y2": 421.0697, "r_x3": 528.04962, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 194, "label": "text", "bbox": { "l": 385.2814, "t": 432.04431, "r": 391.60071, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 438.36295, "r_x1": 391.60071, "r_y1": 438.36295, "r_x2": 391.60071, "r_y2": 432.04431, "r_x3": 385.2814, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 195, "label": "text", "bbox": { "l": 398.52341, "t": 432.04431, "r": 404.84271, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 438.36295, "r_x1": 404.84271, "r_y1": 438.36295, "r_x2": 404.84271, "r_y2": 432.04431, "r_x3": 398.52341, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 196, "label": "text", "bbox": { "l": 411.47604, "t": 432.04431, "r": 417.79532, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 438.36295, "r_x1": 417.79532, "r_y1": 438.36295, "r_x2": 417.79532, "r_y2": 432.04431, "r_x3": 411.47604, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 197, "label": "text", "bbox": { "l": 424.42865, "t": 432.04431, "r": 430.74796, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 438.36295, "r_x1": 430.74796, "r_y1": 438.36295, "r_x2": 430.74796, "r_y2": 432.04431, "r_x3": 424.42865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 198, "label": "text", "bbox": { "l": 437.38129, "t": 432.04431, "r": 443.70056, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 438.36295, "r_x1": 443.70056, "r_y1": 438.36295, "r_x2": 443.70056, "r_y2": 432.04431, "r_x3": 437.38129, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 199, "label": "text", "bbox": { "l": 450.33389000000005, "t": 432.04431, "r": 456.65319999999997, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 438.36295, "r_x1": 456.65319999999997, "r_y1": 438.36295, "r_x2": 456.65319999999997, "r_y2": 432.04431, "r_x3": 450.33389000000005, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 200, "label": "text", "bbox": { "l": 463.2865, "t": 432.04431, "r": 469.6058, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 438.36295, "r_x1": 469.6058, "r_y1": 438.36295, "r_x2": 469.6058, "r_y2": 432.04431, "r_x3": 463.2865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 201, "label": "text", "bbox": { "l": 476.23914, "t": 432.04431, "r": 482.55841, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 438.36295, "r_x1": 482.55841, "r_y1": 438.36295, "r_x2": 482.55841, "r_y2": 432.04431, "r_x3": 476.23914, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 202, "label": "text", "bbox": { "l": 489.1917700000001, "t": 432.04431, "r": 495.51105, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 438.36295, "r_x1": 495.51105, "r_y1": 438.36295, "r_x2": 495.51105, "r_y2": 432.04431, "r_x3": 489.1917700000001, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 203, "label": "text", "bbox": { "l": 502.14438, "t": 432.04431, "r": 508.46368, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 438.36295, "r_x1": 508.46368, "r_y1": 438.36295, "r_x2": 508.46368, "r_y2": 432.04431, "r_x3": 502.14438, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 204, "label": "text", "bbox": { "l": 515.09705, "t": 432.04431, "r": 521.41632, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 438.36295, "r_x1": 521.41632, "r_y1": 438.36295, "r_x2": 521.41632, "r_y2": 432.04431, "r_x3": 515.09705, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 205, "label": "text", "bbox": { "l": 528.04962, "t": 432.04431, "r": 534.3689, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 438.36295, "r_x1": 534.3689, "r_y1": 438.36295, "r_x2": 534.3689, "r_y2": 432.04431, "r_x3": 528.04962, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 206, "label": "text", "bbox": { "l": 385.2814, "t": 389.20004, "r": 388.44073, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 395.51868, "r_x1": 388.44073, "r_y1": 395.51868, "r_x2": 388.44073, "r_y2": 389.20004, "r_x3": 385.2814, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 207, "label": "text", "bbox": { "l": 398.52341, "t": 389.20004, "r": 401.68274, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 395.51868, "r_x1": 401.68274, "r_y1": 395.51868, "r_x2": 401.68274, "r_y2": 389.20004, "r_x3": 398.52341, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 208, "label": "text", "bbox": { "l": 411.4754, "t": 389.20004, "r": 414.63474, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.4754, "r_y0": 395.51868, "r_x1": 414.63474, "r_y1": 395.51868, "r_x2": 414.63474, "r_y2": 389.20004, "r_x3": 411.4754, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 209, "label": "text", "bbox": { "l": 424.4274, "t": 389.20004, "r": 427.58673, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.4274, "r_y0": 395.51868, "r_x1": 427.58673, "r_y1": 395.51868, "r_x2": 427.58673, "r_y2": 389.20004, "r_x3": 424.4274, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 210, "label": "text", "bbox": { "l": 437.37939, "t": 389.20004, "r": 440.53870000000006, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 395.51868, "r_x1": 440.53870000000006, "r_y1": 395.51868, "r_x2": 440.53870000000006, "r_y2": 389.20004, "r_x3": 437.37939, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 211, "label": "text", "bbox": { "l": 450.33136, "t": 389.20004, "r": 453.49069000000003, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33136, "r_y0": 395.51868, "r_x1": 453.49069000000003, "r_y1": 395.51868, "r_x2": 453.49069000000003, "r_y2": 389.20004, "r_x3": 450.33136, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 212, "label": "text", "bbox": { "l": 463.28336, "t": 389.20004, "r": 466.44269, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28336, "r_y0": 395.51868, "r_x1": 466.44269, "r_y1": 395.51868, "r_x2": 466.44269, "r_y2": 389.20004, "r_x3": 463.28336, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 213, "label": "text", "bbox": { "l": 476.23535, "t": 389.20004, "r": 479.39468, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23535, "r_y0": 395.51868, "r_x1": 479.39468, "r_y1": 395.51868, "r_x2": 479.39468, "r_y2": 389.20004, "r_x3": 476.23535, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 214, "label": "text", "bbox": { "l": 489.18735, "t": 389.20004, "r": 492.34668, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18735, "r_y0": 395.51868, "r_x1": 492.34668, "r_y1": 395.51868, "r_x2": 492.34668, "r_y2": 389.20004, "r_x3": 489.18735, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 215, "label": "text", "bbox": { "l": 502.13933999999995, "t": 389.20004, "r": 505.29868000000005, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.13933999999995, "r_y0": 395.51868, "r_x1": 505.29868000000005, "r_y1": 395.51868, "r_x2": 505.29868000000005, "r_y2": 389.20004, "r_x3": 502.13933999999995, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 216, "label": "text", "bbox": { "l": 515.09131, "t": 389.20004, "r": 521.41064, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09131, "r_y0": 395.51868, "r_x1": 521.41064, "r_y1": 395.51868, "r_x2": 521.41064, "r_y2": 389.20004, "r_x3": 515.09131, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 217, "label": "text", "bbox": { "l": 528.04364, "t": 389.20004, "r": 534.13104, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04364, "r_y0": 395.51868, "r_x1": 534.13104, "r_y1": 395.51868, "r_x2": 534.13104, "r_y2": 389.20004, "r_x3": 528.04364, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 218, "label": "text", "bbox": { "l": 385.2814, "t": 398.97464, "r": 391.60071, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 405.29327, "r_x1": 391.60071, "r_y1": 405.29327, "r_x2": 391.60071, "r_y2": 398.97464, "r_x3": 385.2814, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 219, "label": "text", "bbox": { "l": 398.52341, "t": 398.97464, "r": 404.84271, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 405.29327, "r_x1": 404.84271, "r_y1": 405.29327, "r_x2": 404.84271, "r_y2": 398.97464, "r_x3": 398.52341, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 220, "label": "text", "bbox": { "l": 411.47604, "t": 398.97464, "r": 417.79535, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 405.29327, "r_x1": 417.79535, "r_y1": 405.29327, "r_x2": 417.79535, "r_y2": 398.97464, "r_x3": 411.47604, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 221, "label": "text", "bbox": { "l": 424.42719, "t": 406.77463000000006, "r": 430.74648999999994, "b": 413.09326, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42719, "r_y0": 413.09326, "r_x1": 430.74648999999994, "r_y1": 413.09326, "r_x2": 430.74648999999994, "r_y2": 406.77463000000006, "r_x3": 424.42719, "r_y3": 406.77463000000006, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 222, "label": "text", "bbox": { "l": 502.86941999999993, "t": 410.99438, "r": 509.18871999999993, "b": 417.31302, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.86941999999993, "r_y0": 417.31302, "r_x1": 509.18871999999993, "r_y1": 417.31302, "r_x2": 509.18871999999993, "r_y2": 410.99438, "r_x3": 502.86941999999993, "r_y3": 410.99438, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 223, "label": "text", "bbox": { "l": 384.35437, "t": 381.77722, "r": 430.99261, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35437, "r_y0": 386.44281, "r_x1": 430.99261, "r_y1": 386.44281, "r_x2": 430.99261, "r_y2": 381.77722, "r_x3": 384.35437, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 62.595001, "t": 458.72836, "r": 532.63049, "b": 467.63492, "coord_origin": "TOPLEFT" }, "confidence": 0.9153602719306946, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.595001, "r_y0": 467.63492, "r_x1": 532.63049, "r_y1": 467.63492, "r_x2": 532.63049, "r_y2": 458.72836, "r_x3": 62.595001, "r_y3": 458.72836, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 50.112, "t": 491.39536, "r": 163.7558, "b": 501.24741, "coord_origin": "TOPLEFT" }, "confidence": 0.9561247229576111, "cells": [ { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 501.24741, "r_x1": 64.448898, "r_y1": 501.24741, "r_x2": 64.448898, "r_y2": 491.39536, "r_x3": 50.112, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.006828, "r_y0": 501.24741, "r_x1": 163.7558, "r_y1": 501.24741, "r_x2": 163.7558, "r_y2": 491.39536, "r_x3": 74.006828, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.5. Qualitative Analysis" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 536.87337, "r": 286.36511, "b": 713.1519470000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9852361679077148, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 545.77992, "r_x1": 286.36499, "r_y1": 545.77992, "r_x2": 286.36499, "r_y2": 536.87337, "r_x3": 62.067001, "r_y3": 536.87337, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 557.73492, "r_x1": 211.15741, "r_y1": 557.73492, "r_x2": 211.15741, "r_y2": 548.82837, "r_x3": 50.112, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.10000999999997, "r_y0": 557.50578, "r_x1": 259.17453, "r_y1": 557.50578, "r_x2": 259.17453, "r_y2": 548.91803, "r_x3": 215.10000999999997, "r_y3": 548.91803, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73492, "r_x1": 286.36273, "r_y1": 557.73492, "r_x2": 286.36273, "r_y2": 548.82837, "r_x3": 263.12, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 569.68993, "r_x1": 286.36505, "r_y1": 569.68993, "r_x2": 286.36505, "r_y2": 560.78337, "r_x3": 50.112, "r_y3": 560.78337, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 581.6449299999999, "r_x1": 286.36508, "r_y1": 581.6449299999999, "r_x2": 286.36508, "r_y2": 572.73837, "r_x3": 50.112, "r_y3": 572.73837, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 593.59993, "r_x1": 286.36508, "r_y1": 593.59993, "r_x2": 286.36508, "r_y2": 584.69337, "r_x3": 50.112, "r_y3": 584.69337, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 605.55592, "r_x1": 286.36505, "r_y1": 605.55592, "r_x2": 286.36505, "r_y2": 596.64937, "r_x3": 50.112, "r_y3": 596.64937, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 617.51093, "r_x1": 286.36508, "r_y1": 617.51093, "r_x2": 286.36508, "r_y2": 608.60437, "r_x3": 50.112, "r_y3": 608.60437, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 629.46593, "r_x1": 286.36508, "r_y1": 629.46593, "r_x2": 286.36508, "r_y2": 620.55937, "r_x3": 50.112, "r_y3": 620.55937, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 641.42093, "r_x1": 286.36508, "r_y1": 641.42093, "r_x2": 286.36508, "r_y2": 632.51437, "r_x3": 50.112, "r_y3": 632.51437, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 653.37593, "r_x1": 286.36508, "r_y1": 653.37593, "r_x2": 286.36508, "r_y2": 644.46938, "r_x3": 50.112, "r_y3": 644.46938, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 665.33094, "r_x1": 286.36511, "r_y1": 665.33094, "r_x2": 286.36511, "r_y2": 656.42438, "r_x3": 50.112, "r_y3": 656.42438, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 677.28694, "r_x1": 286.36508, "r_y1": 677.28694, "r_x2": 286.36508, "r_y2": 668.38037, "r_x3": 50.112, "r_y3": 668.38037, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 689.24194, "r_x1": 286.36511, "r_y1": 689.24194, "r_x2": 286.36511, "r_y2": 680.33537, "r_x3": 50.112, "r_y3": 680.33537, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 701.196945, "r_x1": 286.36511, "r_y1": 701.196945, "r_x2": 286.36511, "r_y2": 692.290375, "r_x3": 50.112, "r_y3": 692.290375, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.1519470000001, "r_x1": 226.88833999999997, "r_y1": 713.1519470000001, "r_x2": 226.88833999999997, "r_y2": 704.245377, "r_x3": 50.112, "r_y3": 704.245377, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type." }, { "label": "section_header", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 308.862, "t": 490.70892, "r": 460.84848, "b": 501.45663, "coord_origin": "TOPLEFT" }, "confidence": 0.9436525702476501, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 501.45663, "r_x1": 316.07382, "r_y1": 501.45663, "r_x2": 316.07382, "r_y2": 490.70892, "r_x3": 308.862, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.68954, "r_y0": 501.45663, "r_x1": 460.84848, "r_y1": 501.45663, "r_x2": 460.84848, "r_y2": 490.70892, "r_x3": 325.68954, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Future Work & Conclusion" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 512.89337, "r": 545.11517, "b": 653.30592, "coord_origin": "TOPLEFT" }, "confidence": 0.9875594973564148, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 521.79993, "r_x1": 545.11505, "r_y1": 521.79993, "r_x2": 545.11505, "r_y2": 512.89337, "r_x3": 320.81699, "r_y3": 512.89337, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.75491, "r_x1": 545.11517, "r_y1": 533.75491, "r_x2": 545.11517, "r_y2": 524.84836, "r_x3": 308.862, "r_y3": 524.84836, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.70992, "r_x1": 545.11511, "r_y1": 545.70992, "r_x2": 545.11511, "r_y2": 536.80336, "r_x3": 308.862, "r_y3": 536.80336, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.6649199999999, "r_x1": 545.11505, "r_y1": 557.6649199999999, "r_x2": 545.11505, "r_y2": 548.75836, "r_x3": 308.862, "r_y3": 548.75836, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.61992, "r_x1": 545.11517, "r_y1": 569.61992, "r_x2": 545.11517, "r_y2": 560.71336, "r_x3": 308.862, "r_y3": 560.71336, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.57492, "r_x1": 545.11511, "r_y1": 581.57492, "r_x2": 545.11511, "r_y2": 572.66837, "r_x3": 308.862, "r_y3": 572.66837, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.53091, "r_x1": 545.11511, "r_y1": 593.53091, "r_x2": 545.11511, "r_y2": 584.62436, "r_x3": 308.862, "r_y3": 584.62436, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.48592, "r_x1": 400.46808, "r_y1": 605.48592, "r_x2": 400.46808, "r_y2": 596.57936, "r_x3": 308.862, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.37839, "r_y0": 605.48592, "r_x1": 545.11511, "r_y1": 605.48592, "r_x2": 545.11511, "r_y2": 596.57936, "r_x3": 408.37839, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.44092, "r_x1": 545.11505, "r_y1": 617.44092, "r_x2": 545.11505, "r_y2": 608.53436, "r_x3": 308.862, "r_y3": 608.53436, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.3959199999999, "r_x1": 545.11511, "r_y1": 629.3959199999999, "r_x2": 545.11511, "r_y2": 620.48936, "r_x3": 308.862, "r_y3": 620.48936, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.35092, "r_x1": 545.11505, "r_y1": 641.35092, "r_x2": 545.11505, "r_y2": 632.4443699999999, "r_x3": 308.862, "r_y3": 632.4443699999999, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.30592, "r_x1": 365.85803, "r_y1": 653.30592, "r_x2": 365.85803, "r_y2": 644.39937, "r_x3": 308.862, "r_y3": 644.39937, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 308.862, "t": 672.09892, "r": 364.40585, "b": 682.84664, "coord_origin": "TOPLEFT" }, "confidence": 0.9442470073699951, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 682.84664, "r_x1": 364.40585, "r_y1": 682.84664, "r_x2": 364.40585, "r_y2": 672.09892, "r_x3": 308.862, "r_y3": 672.09892, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 10, "page_no": 7, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 313.345, "t": 693.9617920000001, "r": 545.1134, "b": 712.936752, "coord_origin": "TOPLEFT" }, "confidence": 0.8318753838539124, "cells": [ { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.345, "r_y0": 701.977753, "r_x1": 323.80792, "r_y1": 701.977753, "r_x2": 323.80792, "r_y2": 693.9617920000001, "r_x3": 313.345, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05127, "r_y0": 701.977753, "r_x1": 545.10852, "r_y1": 701.977753, "r_x2": 545.10852, "r_y2": 693.9617920000001, "r_x3": 326.05127, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 712.936752, "r_x1": 545.1134, "r_y1": 712.936752, "r_x2": 545.1134, "r_y2": 704.920792, "r_x3": 328.78101, "r_y3": 704.920792, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-" }, { "label": "page_footer", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133366, "r": 300.10229, "b": 743.039928, "coord_origin": "TOPLEFT" }, "confidence": 0.8709858059883118, "cells": [ { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "picture", "id": 15, "page_no": 7, "cluster": { "id": 15, "label": "picture", "bbox": { "l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT" }, "confidence": 0.7699173092842102, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 14, "page_no": 7, "cluster": { "id": 14, "label": "picture", "bbox": { "l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT" }, "confidence": 0.7873926162719727, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 18, "page_no": 7, "cluster": { "id": 18, "label": "caption", "bbox": { "l": 53.811783000000005, "t": 208.23328000000004, "r": 385.93451, "b": 216.10645, "coord_origin": "TOPLEFT" }, "confidence": 0.5986505746841431, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 216.10645, "r_x1": 62.219952, "r_y1": 216.10645, "r_x2": 62.219952, "r_y2": 208.23328000000004, "r_x3": 53.811783000000005, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.424026, "r_y0": 216.10645, "r_x1": 385.93451, "r_y1": 216.10645, "r_x2": 385.93451, "r_y2": 208.23328000000004, "r_x3": 66.424026, "r_y3": 208.23328000000004, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:" }, { "label": "section_header", "id": 29, "page_no": 7, "cluster": { "id": 29, "label": "section_header", "bbox": { "l": 53.811783000000005, "t": 94.28112999999996, "r": 284.34592, "b": 102.15430000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.46452972292900085, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.811783000000005, "r_y0": 102.15430000000003, "r_x1": 284.34592, "r_y1": 102.15430000000003, "r_x2": 284.34592, "r_y2": 94.28112999999996, "r_x3": 53.811783000000005, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Japanese language (previously unseen by TableFormer):" }, { "label": "section_header", "id": 31, "page_no": 7, "cluster": { "id": 31, "label": "section_header", "bbox": { "l": 304.83081, "t": 94.28112999999996, "r": 431.09119, "b": 102.15430000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.4629225730895996, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83081, "r_y0": 102.15430000000003, "r_x1": 431.09119, "r_y1": 102.15430000000003, "r_x2": 431.09119, "r_y2": 94.28112999999996, "r_x3": 304.83081, "r_y3": 94.28112999999996, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Example table from FinTabNet:" }, { "label": "list_item", "id": 20, "page_no": 7, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 53.286037, "t": 78.68756000000008, "r": 61.550289, "b": 86.56073000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.5820134282112122, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.286037, "r_y0": 86.56073000000004, "r_x1": 61.550289, "r_y1": 86.56073000000004, "r_x2": 61.550289, "r_y2": 78.68756000000008, "r_x3": 53.286037, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a." }, { "label": "list_item", "id": 21, "page_no": 7, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 65.682419, "t": 78.68756000000008, "r": 499.55563, "b": 86.56073000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.541211724281311, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.682419, "r_y0": 86.56073000000004, "r_x1": 499.55563, "r_y1": 86.56073000000004, "r_x2": 499.55563, "r_y2": 78.68756000000008, "r_x3": 65.682419, "r_y3": 78.68756000000008, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells" }, { "label": "table", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "table", "bbox": { "l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT" }, "confidence": 0.8824009299278259, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93285, "t": 222.18073000000004, "r": 241.04458999999997, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93285, "r_y0": 226.36212, "r_x1": 241.04458999999997, "r_y1": 226.36212, "r_x2": 241.04458999999997, "r_y2": 222.18073000000004, "r_x3": 209.93285, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76489, "t": 222.18073000000004, "r": 284.50589, "b": 226.36212, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76489, "r_y0": 226.36212, "r_x1": 284.50589, "r_y1": 226.36212, "r_x2": 284.50589, "r_y2": 222.18073000000004, "r_x3": 263.76489, "r_y3": 222.18073000000004, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.24990999999999, "t": 229.66594999999995, "r": 120.62018, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.24990999999999, "r_y0": 233.84735, "r_x1": 120.62018, "r_y1": 233.84735, "r_x2": 120.62018, "r_y2": 229.66594999999995, "r_x3": 110.24990999999999, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.36609, "t": 229.66594999999995, "r": 196.1071, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.36609, "r_y0": 233.84735, "r_x1": 196.1071, "r_y1": 233.84735, "r_x2": 196.1071, "r_y2": 229.66594999999995, "r_x3": 175.36609, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.10756, "t": 229.66594999999995, "r": 201.29247, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.10756, "r_y0": 233.84735, "r_x1": 201.29247, "r_y1": 233.84735, "r_x2": 201.29247, "r_y2": 229.66594999999995, "r_x3": 196.10756, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62408, "t": 229.66594999999995, "r": 219.99435, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62408, "r_y0": 233.84735, "r_x1": 219.99435, "r_y1": 233.84735, "r_x2": 219.99435, "r_y2": 229.66594999999995, "r_x3": 209.62408, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.19814, "t": 229.66594999999995, "r": 244.75377, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.19814, "r_y0": 233.84735, "r_x1": 244.75377, "r_y1": 233.84735, "r_x2": 244.75377, "r_y2": 229.66594999999995, "r_x3": 229.19814, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.1142, "t": 229.66594999999995, "r": 266.48447, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.1142, "r_y0": 233.84735, "r_x1": 266.48447, "r_y1": 233.84735, "r_x2": 266.48447, "r_y2": 229.66594999999995, "r_x3": 256.1142, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38434, "t": 229.66594999999995, "r": 293.93997, "b": 233.84735, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38434, "r_y0": 233.84735, "r_x1": 293.93997, "r_y1": 233.84735, "r_x2": 293.93997, "r_y2": 229.66594999999995, "r_x3": 278.38434, "r_y3": 229.66594999999995, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53052099999999, "t": 236.42584, "r": 162.7131, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 240.78375000000005, "r_x1": 162.7131, "r_y1": 240.78375000000005, "r_x2": 162.7131, "r_y2": 236.42584, "r_x3": 55.53052099999999, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.39731, "t": 236.42584, "r": 189.56456, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 240.78375000000005, "r_x1": 189.56456, "r_y1": 240.78375000000005, "r_x2": 189.56456, "r_y2": 236.42584, "r_x3": 184.39731, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99026, "t": 236.42584, "r": 214.15752, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 240.78375000000005, "r_x1": 214.15752, "r_y1": 240.78375000000005, "r_x2": 214.15752, "r_y2": 236.42584, "r_x3": 208.99026, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.87517, "t": 236.42584, "r": 237.45833000000002, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 240.78375000000005, "r_x1": 237.45833000000002, "r_y1": 240.78375000000005, "r_x2": 237.45833000000002, "r_y2": 236.42584, "r_x3": 234.87517, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88446, "t": 236.42584, "r": 264.6358, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 240.78375000000005, "r_x1": 264.6358, "r_y1": 240.78375000000005, "r_x2": 264.6358, "r_y2": 236.42584, "r_x3": 256.88446, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06134, "t": 236.42584, "r": 286.6445, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 240.78375000000005, "r_x1": 286.6445, "r_y1": 240.78375000000005, "r_x2": 286.6445, "r_y2": 236.42584, "r_x3": 284.06134, "r_y3": 236.42584, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53052099999999, "t": 242.62048000000004, "r": 139.72253, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 246.97839, "r_x1": 139.72253, "r_y1": 246.97839, "r_x2": 139.72253, "r_y2": 242.62048000000004, "r_x3": 55.53052099999999, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.10536, "t": 242.62048000000004, "r": 190.8567, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 246.97839, "r_x1": 190.8567, "r_y1": 246.97839, "r_x2": 190.8567, "r_y2": 242.62048000000004, "r_x3": 183.10536, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.69832, "t": 242.62048000000004, "r": 215.44965999999997, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 246.97839, "r_x1": 215.44965999999997, "r_y1": 246.97839, "r_x2": 215.44965999999997, "r_y2": 242.62048000000004, "r_x3": 207.69832, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.87517, "t": 242.62048000000004, "r": 237.45833000000002, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.87517, "r_y0": 246.97839, "r_x1": 237.45833000000002, "r_y1": 246.97839, "r_x2": 237.45833000000002, "r_y2": 242.62048000000004, "r_x3": 234.87517, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88446, "t": 242.62048000000004, "r": 264.6358, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 246.97839, "r_x1": 264.6358, "r_y1": 246.97839, "r_x2": 264.6358, "r_y2": 242.62048000000004, "r_x3": 256.88446, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06134, "t": 242.62048000000004, "r": 286.6445, "b": 246.97839, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06134, "r_y0": 246.97839, "r_x1": 286.6445, "r_y1": 246.97839, "r_x2": 286.6445, "r_y2": 242.62048000000004, "r_x3": 284.06134, "r_y3": 242.62048000000004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53052099999999, "t": 249.79845999999998, "r": 97.013, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 253.97986000000003, "r_x1": 97.013, "r_y1": 253.97986000000003, "r_x2": 97.013, "r_y2": 249.79845999999998, "r_x3": 55.53052099999999, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.698288, "t": 249.58942000000002, "r": 103.03371, "b": 253.94732999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.698288, "r_y0": 253.94732999999997, "r_x1": 103.03371, "r_y1": 253.94732999999997, "r_x2": 103.03371, "r_y2": 249.58942000000002, "r_x3": 92.698288, "r_y3": 249.58942000000002, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03389, "t": 249.79845999999998, "r": 128.96027, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03389, "r_y0": 253.97986000000003, "r_x1": 128.96027, "r_y1": 253.97986000000003, "r_x2": 128.96027, "r_y2": 249.79845999999998, "r_x3": 103.03389, "r_y3": 249.79845999999998, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.10536, "t": 248.81506000000002, "r": 190.8567, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 253.17296999999996, "r_x1": 190.8567, "r_y1": 253.17296999999996, "r_x2": 190.8567, "r_y2": 248.81506000000002, "r_x3": 183.10536, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28223, "t": 248.81506000000002, "r": 212.86539, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 253.17296999999996, "r_x1": 212.86539, "r_y1": 253.17296999999996, "r_x2": 212.86539, "r_y2": 248.81506000000002, "r_x3": 210.28223, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29153, "t": 248.81506000000002, "r": 240.04287999999997, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 253.17296999999996, "r_x1": 240.04287999999997, "r_y1": 253.17296999999996, "r_x2": 240.04287999999997, "r_y2": 248.81506000000002, "r_x3": 232.29153, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88446, "t": 248.81506000000002, "r": 264.6358, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 253.17296999999996, "r_x1": 264.6358, "r_y1": 253.17296999999996, "r_x2": 264.6358, "r_y2": 248.81506000000002, "r_x3": 256.88446, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.47742, "t": 248.81506000000002, "r": 289.22876, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 253.17296999999996, "r_x1": 289.22876, "r_y1": 253.17296999999996, "r_x2": 289.22876, "r_y2": 248.81506000000002, "r_x3": 281.47742, "r_y3": 248.81506000000002, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53052099999999, "t": 257.28369, "r": 91.827637, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 261.46509000000003, "r_x1": 91.827637, "r_y1": 261.46509000000003, "r_x2": 91.827637, "r_y2": 257.28369, "r_x3": 55.53052099999999, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.052673, "t": 257.07465, "r": 93.219925, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.052673, "r_y0": 261.43255999999997, "r_x1": 93.219925, "r_y1": 261.43255999999997, "r_x2": 93.219925, "r_y2": 257.07465, "r_x3": 88.052673, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.220474, "t": 257.28369, "r": 119.14685, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.220474, "r_y0": 261.46509000000003, "r_x1": 119.14685, "r_y1": 261.46509000000003, "r_x2": 119.14685, "r_y2": 257.28369, "r_x3": 93.220474, "r_y3": 257.28369, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45073999999998, "t": 257.07465, "r": 129.88177, "b": 261.43255999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 261.43255999999997, "r_x1": 129.88177, "r_y1": 261.43255999999997, "r_x2": 129.88177, "r_y2": 257.07465, "r_x3": 116.45073999999998, "r_y3": 257.07465, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.10536, "t": 256.30029, "r": 190.8567, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 260.65819999999997, "r_x1": 190.8567, "r_y1": 260.65819999999997, "r_x2": 190.8567, "r_y2": 256.30029, "r_x3": 183.10536, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28223, "t": 256.30029, "r": 212.86539, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 260.65819999999997, "r_x1": 212.86539, "r_y1": 260.65819999999997, "r_x2": 212.86539, "r_y2": 256.30029, "r_x3": 210.28223, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29153, "t": 256.30029, "r": 240.04287999999997, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 260.65819999999997, "r_x1": 240.04287999999997, "r_y1": 260.65819999999997, "r_x2": 240.04287999999997, "r_y2": 256.30029, "r_x3": 232.29153, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88446, "t": 256.30029, "r": 264.6358, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 260.65819999999997, "r_x1": 264.6358, "r_y1": 260.65819999999997, "r_x2": 264.6358, "r_y2": 256.30029, "r_x3": 256.88446, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.47742, "t": 256.30029, "r": 289.22876, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 260.65819999999997, "r_x1": 289.22876, "r_y1": 260.65819999999997, "r_x2": 289.22876, "r_y2": 256.30029, "r_x3": 281.47742, "r_y3": 256.30029, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53052099999999, "t": 264.5108, "r": 60.715424, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 268.69219999999996, "r_x1": 60.715424, "r_y1": 268.69219999999996, "r_x2": 60.715424, "r_y2": 264.5108, "r_x3": 55.53052099999999, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.17654799999999, "t": 264.30175999999994, "r": 65.343796, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.17654799999999, "r_y0": 268.65967, "r_x1": 65.343796, "r_y1": 268.65967, "r_x2": 65.343796, "r_y2": 264.30175999999994, "r_x3": 60.17654799999999, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.344376, "t": 264.5108, "r": 122.38297000000001, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.344376, "r_y0": 268.69219999999996, "r_x1": 122.38297000000001, "r_y1": 268.69219999999996, "r_x2": 122.38297000000001, "r_y2": 264.5108, "r_x3": 65.344376, "r_y3": 264.5108, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45073999999998, "t": 264.30175999999994, "r": 129.88177, "b": 268.65967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45073999999998, "r_y0": 268.65967, "r_x1": 129.88177, "r_y1": 268.65967, "r_x2": 129.88177, "r_y2": 264.30175999999994, "r_x3": 116.45073999999998, "r_y3": 264.30175999999994, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.10536, "t": 263.52739999999994, "r": 190.8567, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 267.88531, "r_x1": 190.8567, "r_y1": 267.88531, "r_x2": 190.8567, "r_y2": 263.52739999999994, "r_x3": 183.10536, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28223, "t": 263.52739999999994, "r": 212.86539, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 267.88531, "r_x1": 212.86539, "r_y1": 267.88531, "r_x2": 212.86539, "r_y2": 263.52739999999994, "r_x3": 210.28223, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29153, "t": 263.52739999999994, "r": 240.04287999999997, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 267.88531, "r_x1": 240.04287999999997, "r_y1": 267.88531, "r_x2": 240.04287999999997, "r_y2": 263.52739999999994, "r_x3": 232.29153, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88446, "t": 263.52739999999994, "r": 264.6358, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 267.88531, "r_x1": 264.6358, "r_y1": 267.88531, "r_x2": 264.6358, "r_y2": 263.52739999999994, "r_x3": 256.88446, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.47742, "t": 263.52739999999994, "r": 289.22876, "b": 267.88531, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 267.88531, "r_x1": 289.22876, "r_y1": 267.88531, "r_x2": 289.22876, "r_y2": 263.52739999999994, "r_x3": 281.47742, "r_y3": 263.52739999999994, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53052099999999, "t": 271.73785, "r": 107.38374, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 275.91925000000003, "r_x1": 107.38374, "r_y1": 275.91925000000003, "r_x2": 107.38374, "r_y2": 271.73785, "r_x3": 55.53052099999999, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99034, "t": 271.52881, "r": 109.74168000000002, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99034, "r_y0": 275.88671999999997, "r_x1": 109.74168000000002, "r_y1": 275.88671999999997, "r_x2": 109.74168000000002, "r_y2": 271.52881, "r_x3": 101.99034, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74204, "t": 271.73785, "r": 114.92695000000002, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74204, "r_y0": 275.91925000000003, "r_x1": 114.92695000000002, "r_y1": 275.91925000000003, "r_x2": 114.92695000000002, "r_y2": 271.73785, "r_x3": 109.74204, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.38793, "t": 271.52881, "r": 122.13927, "b": 275.88671999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.38793, "r_y0": 275.88671999999997, "r_x1": 122.13927, "r_y1": 275.88671999999997, "r_x2": 122.13927, "r_y2": 271.52881, "r_x3": 114.38793, "r_y3": 271.52881, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.13963, "t": 271.73785, "r": 127.32454000000001, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.13963, "r_y0": 275.91925000000003, "r_x1": 127.32454000000001, "r_y1": 275.91925000000003, "r_x2": 127.32454000000001, "r_y2": 271.73785, "r_x3": 122.13963, "r_y3": 271.73785, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.39731, "t": 270.75446, "r": 189.56456, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.39731, "r_y0": 275.11237000000006, "r_x1": 189.56456, "r_y1": 275.11237000000006, "r_x2": 189.56456, "r_y2": 270.75446, "r_x3": 184.39731, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28223, "t": 270.75446, "r": 212.86539, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28223, "r_y0": 275.11237000000006, "r_x1": 212.86539, "r_y1": 275.11237000000006, "r_x2": 212.86539, "r_y2": 270.75446, "r_x3": 210.28223, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58348, "t": 270.75446, "r": 238.75072999999998, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 275.11237000000006, "r_x1": 238.75072999999998, "r_y1": 275.11237000000006, "r_x2": 238.75072999999998, "r_y2": 270.75446, "r_x3": 233.58348, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88446, "t": 270.75446, "r": 264.6358, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 275.11237000000006, "r_x1": 264.6358, "r_y1": 275.11237000000006, "r_x2": 264.6358, "r_y2": 270.75446, "r_x3": 256.88446, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.47742, "t": 270.75446, "r": 289.22876, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 275.11237000000006, "r_x1": 289.22876, "r_y1": 275.11237000000006, "r_x2": 289.22876, "r_y2": 270.75446, "r_x3": 281.47742, "r_y3": 270.75446, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53052099999999, "t": 279.01392, "r": 68.68605, "b": 283.37183, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53052099999999, "r_y0": 283.37183, "r_x1": 68.68605, "r_y1": 283.37183, "r_x2": 68.68605, "r_y2": 279.01392, "r_x3": 55.53052099999999, "r_y3": 279.01392, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.685814, "t": 279.22295999999994, "r": 110.16829999999999, "b": 283.40436, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.685814, "r_y0": 283.40436, "r_x1": 110.16829999999999, "r_y1": 283.40436, "r_x2": 110.16829999999999, "r_y2": 279.22295999999994, "r_x3": 68.685814, "r_y3": 279.22295999999994, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.10536, "t": 277.98157000000003, "r": 190.8567, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 282.33948000000004, "r_x1": 190.8567, "r_y1": 282.33948000000004, "r_x2": 190.8567, "r_y2": 277.98157000000003, "r_x3": 183.10536, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99026, "t": 277.98157000000003, "r": 214.15752, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99026, "r_y0": 282.33948000000004, "r_x1": 214.15752, "r_y1": 282.33948000000004, "r_x2": 214.15752, "r_y2": 277.98157000000003, "r_x3": 208.99026, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58348, "t": 277.98157000000003, "r": 238.75072999999998, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58348, "r_y0": 282.33948000000004, "r_x1": 238.75072999999998, "r_y1": 282.33948000000004, "r_x2": 238.75072999999998, "r_y2": 277.98157000000003, "r_x3": 233.58348, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88446, "t": 277.98157000000003, "r": 264.6358, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88446, "r_y0": 282.33948000000004, "r_x1": 264.6358, "r_y1": 282.33948000000004, "r_x2": 264.6358, "r_y2": 277.98157000000003, "r_x3": 256.88446, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.76938, "t": 277.98157000000003, "r": 287.93661, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.76938, "r_y0": 282.33948000000004, "r_x1": 287.93661, "r_y1": 282.33948000000004, "r_x2": 287.93661, "r_y2": 277.98157000000003, "r_x3": 282.76938, "r_y3": 277.98157000000003, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.61508, "t": 286.45004, "r": 174.79999, "b": 290.63141, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.61508, "r_y0": 290.63141, "r_x1": 174.79999, "r_y1": 290.63141, "r_x2": 174.79999, "r_y2": 286.45004, "r_x3": 169.61508, "r_y3": 286.45004, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.10536, "t": 285.46667, "r": 190.8567, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.10536, "r_y0": 289.8245800000001, "r_x1": 190.8567, "r_y1": 289.8245800000001, "r_x2": 190.8567, "r_y2": 285.46667, "r_x3": 183.10536, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.69832, "t": 285.46667, "r": 215.44965999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.69832, "r_y0": 289.8245800000001, "r_x1": 215.44965999999997, "r_y1": 289.8245800000001, "r_x2": 215.44965999999997, "r_y2": 285.46667, "r_x3": 207.69832, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29153, "t": 285.46667, "r": 240.04287999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29153, "r_y0": 289.8245800000001, "r_x1": 240.04287999999997, "r_y1": 289.8245800000001, "r_x2": 240.04287999999997, "r_y2": 285.46667, "r_x3": 232.29153, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.76506, "t": 285.46667, "r": 265.75204, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.76506, "r_y0": 289.8245800000001, "r_x1": 265.75204, "r_y1": 289.8245800000001, "r_x2": 265.75204, "r_y2": 285.46667, "r_x3": 255.76506, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.47742, "t": 285.46667, "r": 289.22876, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.47742, "r_y0": 289.8245800000001, "r_x1": 289.22876, "r_y1": 289.8245800000001, "r_x2": 289.22876, "r_y2": 285.46667, "r_x3": 281.47742, "r_y3": 285.46667, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 10, "num_cols": 6, "table_cells": [ { "bbox": { "l": 209.93285, "t": 222.18073000000004, "r": 241.04458999999997, "b": 226.36212, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 263.76489, "t": 222.18073000000004, "r": 284.50589, "b": 226.36212, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 110.24990999999999, "t": 229.66594999999995, "r": 120.62018, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 175.36609, "t": 229.66594999999995, "r": 196.1071, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb \u6570", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 209.62408, "t": 229.66594999999995, "r": 219.99435, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 229.19814, "t": 229.66594999999995, "r": 244.75377, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 256.1142, "t": 229.66594999999995, "r": 266.48447, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 278.38434, "t": 229.66594999999995, "r": 293.93997, "b": 233.84735, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 236.42584, "r": 162.7131, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.39731, "t": 236.42584, "r": 189.56456, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99026, "t": 236.42584, "r": 214.15752, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.87517, "t": 236.42584, "r": 237.45833000000002, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 236.42584, "r": 264.6358, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06134, "t": 236.42584, "r": 286.6445, "b": 240.78375000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 242.62048000000004, "r": 139.72253, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 242.62048000000004, "r": 190.8567, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.69832, "t": 242.62048000000004, "r": 215.44965999999997, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.87517, "t": 242.62048000000004, "r": 237.45833000000002, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 242.62048000000004, "r": 264.6358, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06134, "t": 242.62048000000004, "r": 286.6445, "b": 246.97839, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 249.79845999999998, "r": 97.013, "b": 253.97986000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 248.81506000000002, "r": 190.8567, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 248.81506000000002, "r": 212.86539, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 248.81506000000002, "r": 240.04287999999997, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 248.81506000000002, "r": 264.6358, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 248.81506000000002, "r": 289.22876, "b": 253.17296999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 257.28369, "r": 91.827637, "b": 261.46509000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 256.30029, "r": 190.8567, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 256.30029, "r": 212.86539, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 256.30029, "r": 240.04287999999997, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 256.30029, "r": 264.6358, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 256.30029, "r": 289.22876, "b": 260.65819999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 264.5108, "r": 60.715424, "b": 268.69219999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 263.52739999999994, "r": 190.8567, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 263.52739999999994, "r": 212.86539, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 263.52739999999994, "r": 240.04287999999997, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 263.52739999999994, "r": 264.6358, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 263.52739999999994, "r": 289.22876, "b": 267.88531, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 271.73785, "r": 107.38374, "b": 275.91925000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.39731, "t": 270.75446, "r": 189.56456, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28223, "t": 270.75446, "r": 212.86539, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58348, "t": 270.75446, "r": 238.75072999999998, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 270.75446, "r": 264.6358, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 270.75446, "r": 289.22876, "b": 275.11237000000006, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53052099999999, "t": 279.01392, "r": 68.68605, "b": 283.37183, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 277.98157000000003, "r": 190.8567, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99026, "t": 277.98157000000003, "r": 214.15752, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58348, "t": 277.98157000000003, "r": 238.75072999999998, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88446, "t": 277.98157000000003, "r": 264.6358, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 282.76938, "t": 277.98157000000003, "r": 287.93661, "b": 282.33948000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 169.61508, "t": 286.45004, "r": 174.79999, "b": 290.63141, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.10536, "t": 285.46667, "r": 190.8567, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.69832, "t": 285.46667, "r": 215.44965999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29153, "t": 285.46667, "r": 240.04287999999997, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 255.76506, "t": 285.46667, "r": 265.75204, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.47742, "t": 285.46667, "r": 289.22876, "b": 289.8245800000001, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 16, "page_no": 7, "cluster": { "id": 16, "label": "caption", "bbox": { "l": 380.42731, "t": 292.30426, "r": 549.42175, "b": 298.60284, "coord_origin": "TOPLEFT" }, "confidence": 0.7499915957450867, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.42731, "r_y0": 298.60284, "r_x1": 549.42175, "r_y1": 298.60284, "r_x2": 549.42175, "r_y2": 292.30426, "r_x3": 380.42731, "r_y3": 292.30426, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Text is aligned to match original for ease of viewing" }, { "label": "table", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "table", "bbox": { "l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8899767994880676, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.04861, "t": 221.62415, "r": 542.00018, "b": 226.68933000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.04861, "r_y0": 226.68933000000004, "r_x1": 542.00018, "r_y1": 226.68933000000004, "r_x2": 542.00018, "r_y2": 221.62415, "r_x3": 459.04861, "r_y3": 221.62415, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82193, "t": 227.83416999999997, "r": 507.2258, "b": 232.89935000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82193, "r_y0": 232.89935000000003, "r_x1": 507.2258, "r_y1": 232.89935000000003, "r_x2": 507.2258, "r_y2": 227.83416999999997, "r_x3": 493.82193, "r_y3": 227.83416999999997, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.2442, "t": 236.74712999999997, "r": 400.74588, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.2442, "r_y0": 241.81232, "r_x1": 400.74588, "r_y1": 241.81232, "r_x2": 400.74588, "r_y2": 236.74712999999997, "r_x3": 393.2442, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.74643, "t": 236.74712999999997, "r": 404.64523, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.74643, "r_y0": 241.81232, "r_x1": 404.64523, "r_y1": 241.81232, "r_x2": 404.64523, "r_y2": 236.74712999999997, "r_x3": 400.74643, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.6463, "t": 236.74712999999997, "r": 407.34631, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.6463, "r_y0": 241.81232, "r_x1": 407.34631, "r_y1": 241.81232, "r_x2": 407.34631, "r_y2": 236.74712999999997, "r_x3": 404.6463, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.09671, "t": 221.57446000000004, "r": 438.0145, "b": 226.63964999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.09671, "r_y0": 226.63964999999996, "r_x1": 438.0145, "r_y1": 226.63964999999996, "r_x2": 438.0145, "r_y2": 221.57446000000004, "r_x3": 392.09671, "r_y3": 221.57446000000004, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18323, "t": 236.74712999999997, "r": 440.98778999999996, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18323, "r_y0": 241.81232, "r_x1": 440.98778999999996, "r_y1": 241.81232, "r_x2": 440.98778999999996, "r_y2": 236.74712999999997, "r_x3": 427.18323, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38254, "t": 236.74712999999997, "r": 482.48465000000004, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38254, "r_y0": 241.81232, "r_x1": 482.48465000000004, "r_y1": 241.81232, "r_x2": 482.48465000000004, "r_y2": 236.74712999999997, "r_x3": 468.38254, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.92578, "t": 236.74712999999997, "r": 530.73035, "b": 241.81232, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.92578, "r_y0": 241.81232, "r_x1": 530.73035, "r_y1": 241.81232, "r_x2": 530.73035, "r_y2": 236.74712999999997, "r_x3": 516.92578, "r_y3": 236.74712999999997, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11493, "t": 244.61084000000005, "r": 355.6532, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 249.67602999999997, "r_x1": 355.6532, "r_y1": 249.67602999999997, "r_x2": 355.6532, "r_y2": 244.61084000000005, "r_x3": 306.11493, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65427, "t": 244.61084000000005, "r": 364.65607, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65427, "r_y0": 249.67602999999997, "r_x1": 364.65607, "r_y1": 249.67602999999997, "r_x2": 364.65607, "r_y2": 244.61084000000005, "r_x3": 355.65427, "r_y3": 244.61084000000005, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.24661, "t": 244.91327, "r": 400.75238, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 249.97844999999995, "r_x1": 400.75238, "r_y1": 249.97844999999995, "r_x2": 400.75238, "r_y2": 244.91327, "r_x3": 396.24661, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.7529, "t": 244.91327, "r": 403.75531, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 249.97844999999995, "r_x1": 403.75531, "r_y1": 249.97844999999995, "r_x2": 403.75531, "r_y2": 244.91327, "r_x3": 400.7529, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.81838999999997, "t": 244.91327, "r": 437.32708999999994, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 249.97844999999995, "r_x1": 437.32708999999994, "r_y1": 249.97844999999995, "r_x2": 437.32708999999994, "r_y2": 244.91327, "r_x3": 429.81838999999997, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.52859, "t": 244.91327, "r": 478.40103, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.52859, "r_y0": 249.97844999999995, "r_x1": 478.40103, "r_y1": 249.97844999999995, "r_x2": 478.40103, "r_y2": 244.91327, "r_x3": 465.52859, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.97552, "t": 244.91327, "r": 483.55001999999996, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.97552, "r_y0": 249.97844999999995, "r_x1": 483.55001999999996, "r_y1": 249.97844999999995, "r_x2": 483.55001999999996, "r_y2": 244.91327, "r_x3": 480.97552, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.44824, "t": 244.91327, "r": 531.46967, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.44824, "r_y0": 249.97844999999995, "r_x1": 531.46967, "r_y1": 249.97844999999995, "r_x2": 531.46967, "r_y2": 244.91327, "r_x3": 513.44824, "r_y3": 244.91327, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11493, "t": 253.68451000000005, "r": 325.62674, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 258.74969, "r_x1": 325.62674, "r_y1": 258.74969, "r_x2": 325.62674, "r_y2": 253.68451000000005, "r_x3": 306.11493, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.24661, "t": 253.68451000000005, "r": 400.75238, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 258.74969, "r_x1": 400.75238, "r_y1": 258.74969, "r_x2": 400.75238, "r_y2": 253.68451000000005, "r_x3": 396.24661, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.7529, "t": 253.68451000000005, "r": 403.75531, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.7529, "r_y0": 258.74969, "r_x1": 403.75531, "r_y1": 258.74969, "r_x2": 403.75531, "r_y2": 253.68451000000005, "r_x3": 400.7529, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.81838999999997, "t": 253.68451000000005, "r": 437.32708999999994, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.81838999999997, "r_y0": 258.74969, "r_x1": 437.32708999999994, "r_y1": 258.74969, "r_x2": 437.32708999999994, "r_y2": 253.68451000000005, "r_x3": 429.81838999999997, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.43579000000005, "t": 253.68451000000005, "r": 482.54831, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.43579000000005, "r_y0": 258.74969, "r_x1": 482.54831, "r_y1": 258.74969, "r_x2": 482.54831, "r_y2": 253.68451000000005, "r_x3": 466.43579000000005, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29065, "t": 253.68451000000005, "r": 530.80981, "b": 258.74969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29065, "r_y0": 258.74969, "r_x1": 530.80981, "r_y1": 258.74969, "r_x2": 530.80981, "r_y2": 253.68451000000005, "r_x3": 514.29065, "r_y3": 253.68451000000005, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11493, "t": 261.54822, "r": 322.62866, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 266.61339999999996, "r_x1": 322.62866, "r_y1": 266.61339999999996, "r_x2": 322.62866, "r_y2": 261.54822, "r_x3": 306.11493, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43222, "t": 261.54822, "r": 400.73563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 266.61339999999996, "r_x1": 400.73563, "r_y1": 266.61339999999996, "r_x2": 400.73563, "r_y2": 261.54822, "r_x3": 394.43222, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73456, "t": 261.54822, "r": 403.73697, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 266.61339999999996, "r_x1": 403.73697, "r_y1": 266.61339999999996, "r_x2": 403.73697, "r_y2": 261.54822, "r_x3": 400.73456, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.73804, "t": 261.54822, "r": 405.53625, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 266.61339999999996, "r_x1": 405.53625, "r_y1": 266.61339999999996, "r_x2": 405.53625, "r_y2": 261.54822, "r_x3": 403.73804, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7016, "t": 261.54822, "r": 438.80563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7016, "r_y0": 266.61339999999996, "r_x1": 438.80563, "r_y1": 266.61339999999996, "r_x2": 438.80563, "r_y2": 261.54822, "r_x3": 427.7016, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.55533, "t": 261.54822, "r": 482.07043, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.55533, "r_y0": 266.61339999999996, "r_x1": 482.07043, "r_y1": 266.61339999999996, "r_x2": 482.07043, "r_y2": 261.54822, "r_x3": 468.55533, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.01862, "t": 261.54822, "r": 529.53375, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 266.61339999999996, "r_x1": 529.53375, "r_y1": 266.61339999999996, "r_x2": 529.53375, "r_y2": 261.54822, "r_x3": 516.01862, "r_y3": 261.54822, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11493, "t": 269.64148, "r": 356.24771, "b": 274.70667000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 274.70667000000003, "r_x1": 356.24771, "r_y1": 274.70667000000003, "r_x2": 356.24771, "r_y2": 269.64148, "r_x3": 306.11493, "r_y3": 269.64148, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43222, "t": 270.31946000000005, "r": 400.73563, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43222, "r_y0": 275.38464, "r_x1": 400.73563, "r_y1": 275.38464, "r_x2": 400.73563, "r_y2": 270.31946000000005, "r_x3": 394.43222, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73456, "t": 270.31946000000005, "r": 403.73697, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73456, "r_y0": 275.38464, "r_x1": 403.73697, "r_y1": 275.38464, "r_x2": 403.73697, "r_y2": 270.31946000000005, "r_x3": 400.73456, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.73804, "t": 270.31946000000005, "r": 405.53625, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.73804, "r_y0": 275.38464, "r_x1": 405.53625, "r_y1": 275.38464, "r_x2": 405.53625, "r_y2": 270.31946000000005, "r_x3": 403.73804, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.02802, "t": 270.31946000000005, "r": 436.4280099999999, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.02802, "r_y0": 275.38464, "r_x1": 436.4280099999999, "r_y1": 275.38464, "r_x2": 436.4280099999999, "r_y2": 270.31946000000005, "r_x3": 431.02802, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83099000000004, "t": 270.31946000000005, "r": 482.35013, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83099000000004, "r_y0": 275.38464, "r_x1": 482.35013, "r_y1": 275.38464, "r_x2": 482.35013, "r_y2": 270.31946000000005, "r_x3": 465.83099000000004, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.01862, "t": 270.31946000000005, "r": 529.53375, "b": 275.38464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.01862, "r_y0": 275.38464, "r_x1": 529.53375, "r_y1": 275.38464, "r_x2": 529.53375, "r_y2": 270.31946000000005, "r_x3": 516.01862, "r_y3": 270.31946000000005, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11493, "t": 278.48572, "r": 373.35764, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11493, "r_y0": 283.55092999999994, "r_x1": 373.35764, "r_y1": 283.55092999999994, "r_x2": 373.35764, "r_y2": 278.48572, "r_x3": 306.11493, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.24661, "t": 278.48572, "r": 403.75531, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.24661, "r_y0": 283.55092999999994, "r_x1": 403.75531, "r_y1": 283.55092999999994, "r_x2": 403.75531, "r_y2": 278.48572, "r_x3": 396.24661, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.51599, "t": 278.48572, "r": 437.02469, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.51599, "r_y0": 283.55092999999994, "r_x1": 437.02469, "r_y1": 283.55092999999994, "r_x2": 437.02469, "r_y2": 278.48572, "r_x3": 429.51599, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.7142, "t": 278.48572, "r": 484.73965000000004, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.7142, "r_y0": 283.55092999999994, "r_x1": 484.73965000000004, "r_y1": 283.55092999999994, "r_x2": 484.73965000000004, "r_y2": 278.48572, "r_x3": 463.7142, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99463, "t": 278.48572, "r": 534.02008, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99463, "r_y0": 283.55092999999994, "r_x1": 534.02008, "r_y1": 283.55092999999994, "r_x2": 534.02008, "r_y2": 278.48572, "r_x3": 512.99463, "r_y3": 278.48572, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 459.04861, "t": 221.62415, "r": 542.00018, "b": 226.68933000000004, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 393.2442, "t": 236.74712999999997, "r": 400.74588, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RS U s", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 392.09671, "t": 221.57446000000004, "r": 438.0145, "b": 226.63964999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.18323, "t": 236.74712999999997, "r": 440.98778999999996, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 468.38254, "t": 236.74712999999997, "r": 482.48465000000004, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 516.92578, "t": 236.74712999999997, "r": 530.73035, "b": 241.81232, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 244.61084000000005, "r": 355.6532, "b": 249.67602999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on Janua ry 1", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 244.91327, "r": 400.75238, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1. 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.81838999999997, "t": 244.91327, "r": 437.32708999999994, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.52859, "t": 244.91327, "r": 478.40103, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.44824, "t": 244.91327, "r": 531.46967, "b": 249.97844999999995, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 253.68451000000005, "r": 325.62674, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 253.68451000000005, "r": 400.75238, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0. 5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.81838999999997, "t": 253.68451000000005, "r": 437.32708999999994, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 466.43579000000005, "t": 253.68451000000005, "r": 482.54831, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 514.29065, "t": 253.68451000000005, "r": 530.80981, "b": 258.74969, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 261.54822, "r": 322.62866, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43222, "t": 261.54822, "r": 400.73563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 5 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 427.7016, "t": 261.54822, "r": 438.80563, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 468.55533, "t": 261.54822, "r": 482.07043, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.01862, "t": 261.54822, "r": 529.53375, "b": 266.61339999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 269.64148, "r": 356.24771, "b": 274.70667000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43222, "t": 270.31946000000005, "r": 400.73563, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 1 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 431.02802, "t": 270.31946000000005, "r": 436.4280099999999, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.83099000000004, "t": 270.31946000000005, "r": 482.35013, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.01862, "t": 270.31946000000005, "r": 529.53375, "b": 275.38464, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11493, "t": 278.48572, "r": 373.35764, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.24661, "t": 278.48572, "r": 403.75531, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.51599, "t": 278.48572, "r": 437.02469, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 463.7142, "t": 278.48572, "r": 484.73965000000004, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.99463, "t": 278.48572, "r": 534.02008, "b": 283.55092999999994, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.112, "t": 320.87735, "r": 545.11377, "b": 365.64987, "coord_origin": "TOPLEFT" }, "confidence": 0.9140303134918213, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 329.78391, "r_x1": 86.864021, "r_y1": 329.78391, "r_x2": 86.864021, "r_y2": 320.87735, "r_x3": 50.112, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.917542, "r_y0": 329.78391, "r_x1": 545.11371, "r_y1": 329.78391, "r_x2": 545.11371, "r_y2": 320.87735, "r_x3": 93.917542, "r_y3": 320.87735, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 341.73889, "r_x1": 545.11371, "r_y1": 341.73889, "r_x2": 545.11371, "r_y2": 332.83233999999993, "r_x3": 50.112, "r_y3": 332.83233999999993, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 353.69388, "r_x1": 545.11377, "r_y1": 353.69388, "r_x2": 545.11377, "r_y2": 344.78732, "r_x3": 50.112, "r_y3": 344.78732, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.64987, "r_x1": 139.79532, "r_y1": 365.64987, "r_x2": 139.79532, "r_y2": 356.74332, "r_x3": 50.112, "r_y3": 356.74332, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset." }, { "label": "picture", "id": 12, "page_no": 7, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT" }, "confidence": 0.805853009223938, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26282, "r_y0": 386.44281, "r_x1": 342.07819, "r_y1": 386.44281, "r_x2": 342.07819, "r_y2": 381.77722, "r_x3": 220.26282, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 167, "label": "text", "bbox": { "l": 220.26282, "t": 381.77722, "r": 342.07819, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26282, "r_y0": 386.44281, "r_x1": 342.07819, "r_y1": 386.44281, "r_x2": 342.07819, "r_y2": 381.77722, "r_x3": 220.26282, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 11, "page_no": 7, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT" }, "confidence": 0.8308426737785339, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.715248, "r_y0": 386.44281, "r_x1": 85.657333, "r_y1": 386.44281, "r_x2": 85.657333, "r_y2": 381.77722, "r_x3": 53.715248, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 168, "label": "text", "bbox": { "l": 53.715248, "t": 381.77722, "r": 85.657333, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.715248, "r_y0": 386.44281, "r_x1": 85.657333, "r_y1": 386.44281, "r_x2": 85.657333, "r_y2": 381.77722, "r_x3": 53.715248, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 13, "page_no": 7, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT" }, "confidence": 0.7881615161895752, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 406.87158, "r_x1": 443.69870000000003, "r_y1": 406.87158, "r_x2": 443.69870000000003, "r_y2": 400.55295, "r_x3": 437.37939, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 406.87158, "r_x1": 456.6513100000001, "r_y1": 406.87158, "r_x2": 456.6513100000001, "r_y2": 400.55295, "r_x3": 450.33203, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 406.87158, "r_x1": 469.60394, "r_y1": 406.87158, "r_x2": 469.60394, "r_y2": 400.55295, "r_x3": 463.28464, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23724000000004, "r_y0": 406.87158, "r_x1": 482.5565500000001, "r_y1": 406.87158, "r_x2": 482.5565500000001, "r_y2": 400.55295, "r_x3": 476.23724000000004, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18988, "r_y0": 406.87158, "r_x1": 495.50916, "r_y1": 406.87158, "r_x2": 495.50916, "r_y2": 400.55295, "r_x3": 489.18988, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14251999999993, "r_y0": 406.87158, "r_x1": 508.46178999999995, "r_y1": 406.87158, "r_x2": 508.46178999999995, "r_y2": 400.55295, "r_x3": 502.14251999999993, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09509, "r_y0": 406.87158, "r_x1": 521.41443, "r_y1": 406.87158, "r_x2": 521.41443, "r_y2": 400.55295, "r_x3": 515.09509, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 417.35699, "r_x1": 391.60071, "r_y1": 417.35699, "r_x2": 391.60071, "r_y2": 411.03836000000007, "r_x3": 385.2814, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 417.35699, "r_x1": 404.84271, "r_y1": 417.35699, "r_x2": 404.84271, "r_y2": 411.03836000000007, "r_x3": 398.52341, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 417.35699, "r_x1": 417.79535, "r_y1": 417.35699, "r_x2": 417.79535, "r_y2": 411.03836000000007, "r_x3": 411.47604, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 417.35699, "r_x1": 443.69870000000003, "r_y1": 417.35699, "r_x2": 443.69870000000003, "r_y2": 411.03836000000007, "r_x3": 437.37939, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 417.35699, "r_x1": 456.6513100000001, "r_y1": 417.35699, "r_x2": 456.6513100000001, "r_y2": 411.03836000000007, "r_x3": 450.33203, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 417.35699, "r_x1": 469.60394, "r_y1": 417.35699, "r_x2": 469.60394, "r_y2": 411.03836000000007, "r_x3": 463.28464, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 427.38834, "r_x1": 391.60071, "r_y1": 427.38834, "r_x2": 391.60071, "r_y2": 421.0697, "r_x3": 385.2814, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 427.38834, "r_x1": 404.84271, "r_y1": 427.38834, "r_x2": 404.84271, "r_y2": 421.0697, "r_x3": 398.52341, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 427.38834, "r_x1": 417.79532, "r_y1": 427.38834, "r_x2": 417.79532, "r_y2": 421.0697, "r_x3": 411.47604, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 427.38834, "r_x1": 430.74796, "r_y1": 427.38834, "r_x2": 430.74796, "r_y2": 421.0697, "r_x3": 424.42865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 427.38834, "r_x1": 443.70056, "r_y1": 427.38834, "r_x2": 443.70056, "r_y2": 421.0697, "r_x3": 437.38129, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 427.38834, "r_x1": 456.65319999999997, "r_y1": 427.38834, "r_x2": 456.65319999999997, "r_y2": 421.0697, "r_x3": 450.33389000000005, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 427.38834, "r_x1": 469.6058, "r_y1": 427.38834, "r_x2": 469.6058, "r_y2": 421.0697, "r_x3": 463.2865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 427.38834, "r_x1": 482.55841, "r_y1": 427.38834, "r_x2": 482.55841, "r_y2": 421.0697, "r_x3": 476.23914, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 427.38834, "r_x1": 495.51105, "r_y1": 427.38834, "r_x2": 495.51105, "r_y2": 421.0697, "r_x3": 489.1917700000001, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 427.38834, "r_x1": 508.46368, "r_y1": 427.38834, "r_x2": 508.46368, "r_y2": 421.0697, "r_x3": 502.14438, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 427.38834, "r_x1": 521.41632, "r_y1": 427.38834, "r_x2": 521.41632, "r_y2": 421.0697, "r_x3": 515.09705, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 427.38834, "r_x1": 534.3689, "r_y1": 427.38834, "r_x2": 534.3689, "r_y2": 421.0697, "r_x3": 528.04962, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 438.36295, "r_x1": 391.60071, "r_y1": 438.36295, "r_x2": 391.60071, "r_y2": 432.04431, "r_x3": 385.2814, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 438.36295, "r_x1": 404.84271, "r_y1": 438.36295, "r_x2": 404.84271, "r_y2": 432.04431, "r_x3": 398.52341, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 438.36295, "r_x1": 417.79532, "r_y1": 438.36295, "r_x2": 417.79532, "r_y2": 432.04431, "r_x3": 411.47604, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 438.36295, "r_x1": 430.74796, "r_y1": 438.36295, "r_x2": 430.74796, "r_y2": 432.04431, "r_x3": 424.42865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 438.36295, "r_x1": 443.70056, "r_y1": 438.36295, "r_x2": 443.70056, "r_y2": 432.04431, "r_x3": 437.38129, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 438.36295, "r_x1": 456.65319999999997, "r_y1": 438.36295, "r_x2": 456.65319999999997, "r_y2": 432.04431, "r_x3": 450.33389000000005, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 438.36295, "r_x1": 469.6058, "r_y1": 438.36295, "r_x2": 469.6058, "r_y2": 432.04431, "r_x3": 463.2865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 438.36295, "r_x1": 482.55841, "r_y1": 438.36295, "r_x2": 482.55841, "r_y2": 432.04431, "r_x3": 476.23914, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 438.36295, "r_x1": 495.51105, "r_y1": 438.36295, "r_x2": 495.51105, "r_y2": 432.04431, "r_x3": 489.1917700000001, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 438.36295, "r_x1": 508.46368, "r_y1": 438.36295, "r_x2": 508.46368, "r_y2": 432.04431, "r_x3": 502.14438, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 438.36295, "r_x1": 521.41632, "r_y1": 438.36295, "r_x2": 521.41632, "r_y2": 432.04431, "r_x3": 515.09705, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 438.36295, "r_x1": 534.3689, "r_y1": 438.36295, "r_x2": 534.3689, "r_y2": 432.04431, "r_x3": 528.04962, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 395.51868, "r_x1": 388.44073, "r_y1": 395.51868, "r_x2": 388.44073, "r_y2": 389.20004, "r_x3": 385.2814, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 395.51868, "r_x1": 401.68274, "r_y1": 395.51868, "r_x2": 401.68274, "r_y2": 389.20004, "r_x3": 398.52341, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.4754, "r_y0": 395.51868, "r_x1": 414.63474, "r_y1": 395.51868, "r_x2": 414.63474, "r_y2": 389.20004, "r_x3": 411.4754, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.4274, "r_y0": 395.51868, "r_x1": 427.58673, "r_y1": 395.51868, "r_x2": 427.58673, "r_y2": 389.20004, "r_x3": 424.4274, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 395.51868, "r_x1": 440.53870000000006, "r_y1": 395.51868, "r_x2": 440.53870000000006, "r_y2": 389.20004, "r_x3": 437.37939, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33136, "r_y0": 395.51868, "r_x1": 453.49069000000003, "r_y1": 395.51868, "r_x2": 453.49069000000003, "r_y2": 389.20004, "r_x3": 450.33136, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28336, "r_y0": 395.51868, "r_x1": 466.44269, "r_y1": 395.51868, "r_x2": 466.44269, "r_y2": 389.20004, "r_x3": 463.28336, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23535, "r_y0": 395.51868, "r_x1": 479.39468, "r_y1": 395.51868, "r_x2": 479.39468, "r_y2": 389.20004, "r_x3": 476.23535, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18735, "r_y0": 395.51868, "r_x1": 492.34668, "r_y1": 395.51868, "r_x2": 492.34668, "r_y2": 389.20004, "r_x3": 489.18735, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.13933999999995, "r_y0": 395.51868, "r_x1": 505.29868000000005, "r_y1": 395.51868, "r_x2": 505.29868000000005, "r_y2": 389.20004, "r_x3": 502.13933999999995, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09131, "r_y0": 395.51868, "r_x1": 521.41064, "r_y1": 395.51868, "r_x2": 521.41064, "r_y2": 389.20004, "r_x3": 515.09131, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04364, "r_y0": 395.51868, "r_x1": 534.13104, "r_y1": 395.51868, "r_x2": 534.13104, "r_y2": 389.20004, "r_x3": 528.04364, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 405.29327, "r_x1": 391.60071, "r_y1": 405.29327, "r_x2": 391.60071, "r_y2": 398.97464, "r_x3": 385.2814, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 405.29327, "r_x1": 404.84271, "r_y1": 405.29327, "r_x2": 404.84271, "r_y2": 398.97464, "r_x3": 398.52341, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 405.29327, "r_x1": 417.79535, "r_y1": 405.29327, "r_x2": 417.79535, "r_y2": 398.97464, "r_x3": 411.47604, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42719, "r_y0": 413.09326, "r_x1": 430.74648999999994, "r_y1": 413.09326, "r_x2": 430.74648999999994, "r_y2": 406.77463000000006, "r_x3": 424.42719, "r_y3": 406.77463000000006, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.86941999999993, "r_y0": 417.31302, "r_x1": 509.18871999999993, "r_y1": 417.31302, "r_x2": 509.18871999999993, "r_y2": 410.99438, "r_x3": 502.86941999999993, "r_y3": 410.99438, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35437, "r_y0": 386.44281, "r_x1": 430.99261, "r_y1": 386.44281, "r_x2": 430.99261, "r_y2": 381.77722, "r_x3": 384.35437, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 169, "label": "text", "bbox": { "l": 437.37939, "t": 400.55295, "r": 443.69870000000003, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 406.87158, "r_x1": 443.69870000000003, "r_y1": 406.87158, "r_x2": 443.69870000000003, "r_y2": 400.55295, "r_x3": 437.37939, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 170, "label": "text", "bbox": { "l": 450.33203, "t": 400.55295, "r": 456.6513100000001, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 406.87158, "r_x1": 456.6513100000001, "r_y1": 406.87158, "r_x2": 456.6513100000001, "r_y2": 400.55295, "r_x3": 450.33203, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 171, "label": "text", "bbox": { "l": 463.28464, "t": 400.55295, "r": 469.60394, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 406.87158, "r_x1": 469.60394, "r_y1": 406.87158, "r_x2": 469.60394, "r_y2": 400.55295, "r_x3": 463.28464, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 172, "label": "text", "bbox": { "l": 476.23724000000004, "t": 400.55295, "r": 482.5565500000001, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23724000000004, "r_y0": 406.87158, "r_x1": 482.5565500000001, "r_y1": 406.87158, "r_x2": 482.5565500000001, "r_y2": 400.55295, "r_x3": 476.23724000000004, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 173, "label": "text", "bbox": { "l": 489.18988, "t": 400.55295, "r": 495.50916, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18988, "r_y0": 406.87158, "r_x1": 495.50916, "r_y1": 406.87158, "r_x2": 495.50916, "r_y2": 400.55295, "r_x3": 489.18988, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 174, "label": "text", "bbox": { "l": 502.14251999999993, "t": 400.55295, "r": 508.46178999999995, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14251999999993, "r_y0": 406.87158, "r_x1": 508.46178999999995, "r_y1": 406.87158, "r_x2": 508.46178999999995, "r_y2": 400.55295, "r_x3": 502.14251999999993, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 175, "label": "text", "bbox": { "l": 515.09509, "t": 400.55295, "r": 521.41443, "b": 406.87158, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09509, "r_y0": 406.87158, "r_x1": 521.41443, "r_y1": 406.87158, "r_x2": 521.41443, "r_y2": 400.55295, "r_x3": 515.09509, "r_y3": 400.55295, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 176, "label": "text", "bbox": { "l": 385.2814, "t": 411.03836000000007, "r": 391.60071, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 417.35699, "r_x1": 391.60071, "r_y1": 417.35699, "r_x2": 391.60071, "r_y2": 411.03836000000007, "r_x3": 385.2814, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 177, "label": "text", "bbox": { "l": 398.52341, "t": 411.03836000000007, "r": 404.84271, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 417.35699, "r_x1": 404.84271, "r_y1": 417.35699, "r_x2": 404.84271, "r_y2": 411.03836000000007, "r_x3": 398.52341, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 178, "label": "text", "bbox": { "l": 411.47604, "t": 411.03836000000007, "r": 417.79535, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 417.35699, "r_x1": 417.79535, "r_y1": 417.35699, "r_x2": 417.79535, "r_y2": 411.03836000000007, "r_x3": 411.47604, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 179, "label": "text", "bbox": { "l": 437.37939, "t": 411.03836000000007, "r": 443.69870000000003, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 417.35699, "r_x1": 443.69870000000003, "r_y1": 417.35699, "r_x2": 443.69870000000003, "r_y2": 411.03836000000007, "r_x3": 437.37939, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 180, "label": "text", "bbox": { "l": 450.33203, "t": 411.03836000000007, "r": 456.6513100000001, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33203, "r_y0": 417.35699, "r_x1": 456.6513100000001, "r_y1": 417.35699, "r_x2": 456.6513100000001, "r_y2": 411.03836000000007, "r_x3": 450.33203, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 181, "label": "text", "bbox": { "l": 463.28464, "t": 411.03836000000007, "r": 469.60394, "b": 417.35699, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28464, "r_y0": 417.35699, "r_x1": 469.60394, "r_y1": 417.35699, "r_x2": 469.60394, "r_y2": 411.03836000000007, "r_x3": 463.28464, "r_y3": 411.03836000000007, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 182, "label": "text", "bbox": { "l": 385.2814, "t": 421.0697, "r": 391.60071, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 427.38834, "r_x1": 391.60071, "r_y1": 427.38834, "r_x2": 391.60071, "r_y2": 421.0697, "r_x3": 385.2814, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 183, "label": "text", "bbox": { "l": 398.52341, "t": 421.0697, "r": 404.84271, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 427.38834, "r_x1": 404.84271, "r_y1": 427.38834, "r_x2": 404.84271, "r_y2": 421.0697, "r_x3": 398.52341, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 184, "label": "text", "bbox": { "l": 411.47604, "t": 421.0697, "r": 417.79532, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 427.38834, "r_x1": 417.79532, "r_y1": 427.38834, "r_x2": 417.79532, "r_y2": 421.0697, "r_x3": 411.47604, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 185, "label": "text", "bbox": { "l": 424.42865, "t": 421.0697, "r": 430.74796, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 427.38834, "r_x1": 430.74796, "r_y1": 427.38834, "r_x2": 430.74796, "r_y2": 421.0697, "r_x3": 424.42865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 186, "label": "text", "bbox": { "l": 437.38129, "t": 421.0697, "r": 443.70056, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 427.38834, "r_x1": 443.70056, "r_y1": 427.38834, "r_x2": 443.70056, "r_y2": 421.0697, "r_x3": 437.38129, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 187, "label": "text", "bbox": { "l": 450.33389000000005, "t": 421.0697, "r": 456.65319999999997, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 427.38834, "r_x1": 456.65319999999997, "r_y1": 427.38834, "r_x2": 456.65319999999997, "r_y2": 421.0697, "r_x3": 450.33389000000005, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 188, "label": "text", "bbox": { "l": 463.2865, "t": 421.0697, "r": 469.6058, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 427.38834, "r_x1": 469.6058, "r_y1": 427.38834, "r_x2": 469.6058, "r_y2": 421.0697, "r_x3": 463.2865, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 189, "label": "text", "bbox": { "l": 476.23914, "t": 421.0697, "r": 482.55841, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 427.38834, "r_x1": 482.55841, "r_y1": 427.38834, "r_x2": 482.55841, "r_y2": 421.0697, "r_x3": 476.23914, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 190, "label": "text", "bbox": { "l": 489.1917700000001, "t": 421.0697, "r": 495.51105, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 427.38834, "r_x1": 495.51105, "r_y1": 427.38834, "r_x2": 495.51105, "r_y2": 421.0697, "r_x3": 489.1917700000001, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 191, "label": "text", "bbox": { "l": 502.14438, "t": 421.0697, "r": 508.46368, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 427.38834, "r_x1": 508.46368, "r_y1": 427.38834, "r_x2": 508.46368, "r_y2": 421.0697, "r_x3": 502.14438, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 192, "label": "text", "bbox": { "l": 515.09705, "t": 421.0697, "r": 521.41632, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 427.38834, "r_x1": 521.41632, "r_y1": 427.38834, "r_x2": 521.41632, "r_y2": 421.0697, "r_x3": 515.09705, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 193, "label": "text", "bbox": { "l": 528.04962, "t": 421.0697, "r": 534.3689, "b": 427.38834, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 427.38834, "r_x1": 534.3689, "r_y1": 427.38834, "r_x2": 534.3689, "r_y2": 421.0697, "r_x3": 528.04962, "r_y3": 421.0697, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 194, "label": "text", "bbox": { "l": 385.2814, "t": 432.04431, "r": 391.60071, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 438.36295, "r_x1": 391.60071, "r_y1": 438.36295, "r_x2": 391.60071, "r_y2": 432.04431, "r_x3": 385.2814, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 195, "label": "text", "bbox": { "l": 398.52341, "t": 432.04431, "r": 404.84271, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 438.36295, "r_x1": 404.84271, "r_y1": 438.36295, "r_x2": 404.84271, "r_y2": 432.04431, "r_x3": 398.52341, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 196, "label": "text", "bbox": { "l": 411.47604, "t": 432.04431, "r": 417.79532, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 438.36295, "r_x1": 417.79532, "r_y1": 438.36295, "r_x2": 417.79532, "r_y2": 432.04431, "r_x3": 411.47604, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 197, "label": "text", "bbox": { "l": 424.42865, "t": 432.04431, "r": 430.74796, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42865, "r_y0": 438.36295, "r_x1": 430.74796, "r_y1": 438.36295, "r_x2": 430.74796, "r_y2": 432.04431, "r_x3": 424.42865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 198, "label": "text", "bbox": { "l": 437.38129, "t": 432.04431, "r": 443.70056, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38129, "r_y0": 438.36295, "r_x1": 443.70056, "r_y1": 438.36295, "r_x2": 443.70056, "r_y2": 432.04431, "r_x3": 437.38129, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 199, "label": "text", "bbox": { "l": 450.33389000000005, "t": 432.04431, "r": 456.65319999999997, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33389000000005, "r_y0": 438.36295, "r_x1": 456.65319999999997, "r_y1": 438.36295, "r_x2": 456.65319999999997, "r_y2": 432.04431, "r_x3": 450.33389000000005, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 200, "label": "text", "bbox": { "l": 463.2865, "t": 432.04431, "r": 469.6058, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.2865, "r_y0": 438.36295, "r_x1": 469.6058, "r_y1": 438.36295, "r_x2": 469.6058, "r_y2": 432.04431, "r_x3": 463.2865, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 201, "label": "text", "bbox": { "l": 476.23914, "t": 432.04431, "r": 482.55841, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23914, "r_y0": 438.36295, "r_x1": 482.55841, "r_y1": 438.36295, "r_x2": 482.55841, "r_y2": 432.04431, "r_x3": 476.23914, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 202, "label": "text", "bbox": { "l": 489.1917700000001, "t": 432.04431, "r": 495.51105, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.1917700000001, "r_y0": 438.36295, "r_x1": 495.51105, "r_y1": 438.36295, "r_x2": 495.51105, "r_y2": 432.04431, "r_x3": 489.1917700000001, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 203, "label": "text", "bbox": { "l": 502.14438, "t": 432.04431, "r": 508.46368, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14438, "r_y0": 438.36295, "r_x1": 508.46368, "r_y1": 438.36295, "r_x2": 508.46368, "r_y2": 432.04431, "r_x3": 502.14438, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 204, "label": "text", "bbox": { "l": 515.09705, "t": 432.04431, "r": 521.41632, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09705, "r_y0": 438.36295, "r_x1": 521.41632, "r_y1": 438.36295, "r_x2": 521.41632, "r_y2": 432.04431, "r_x3": 515.09705, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 205, "label": "text", "bbox": { "l": 528.04962, "t": 432.04431, "r": 534.3689, "b": 438.36295, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04962, "r_y0": 438.36295, "r_x1": 534.3689, "r_y1": 438.36295, "r_x2": 534.3689, "r_y2": 432.04431, "r_x3": 528.04962, "r_y3": 432.04431, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 206, "label": "text", "bbox": { "l": 385.2814, "t": 389.20004, "r": 388.44073, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 395.51868, "r_x1": 388.44073, "r_y1": 395.51868, "r_x2": 388.44073, "r_y2": 389.20004, "r_x3": 385.2814, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 207, "label": "text", "bbox": { "l": 398.52341, "t": 389.20004, "r": 401.68274, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 395.51868, "r_x1": 401.68274, "r_y1": 395.51868, "r_x2": 401.68274, "r_y2": 389.20004, "r_x3": 398.52341, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 208, "label": "text", "bbox": { "l": 411.4754, "t": 389.20004, "r": 414.63474, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.4754, "r_y0": 395.51868, "r_x1": 414.63474, "r_y1": 395.51868, "r_x2": 414.63474, "r_y2": 389.20004, "r_x3": 411.4754, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 209, "label": "text", "bbox": { "l": 424.4274, "t": 389.20004, "r": 427.58673, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.4274, "r_y0": 395.51868, "r_x1": 427.58673, "r_y1": 395.51868, "r_x2": 427.58673, "r_y2": 389.20004, "r_x3": 424.4274, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 210, "label": "text", "bbox": { "l": 437.37939, "t": 389.20004, "r": 440.53870000000006, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.37939, "r_y0": 395.51868, "r_x1": 440.53870000000006, "r_y1": 395.51868, "r_x2": 440.53870000000006, "r_y2": 389.20004, "r_x3": 437.37939, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 211, "label": "text", "bbox": { "l": 450.33136, "t": 389.20004, "r": 453.49069000000003, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33136, "r_y0": 395.51868, "r_x1": 453.49069000000003, "r_y1": 395.51868, "r_x2": 453.49069000000003, "r_y2": 389.20004, "r_x3": 450.33136, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 212, "label": "text", "bbox": { "l": 463.28336, "t": 389.20004, "r": 466.44269, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28336, "r_y0": 395.51868, "r_x1": 466.44269, "r_y1": 395.51868, "r_x2": 466.44269, "r_y2": 389.20004, "r_x3": 463.28336, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 213, "label": "text", "bbox": { "l": 476.23535, "t": 389.20004, "r": 479.39468, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.23535, "r_y0": 395.51868, "r_x1": 479.39468, "r_y1": 395.51868, "r_x2": 479.39468, "r_y2": 389.20004, "r_x3": 476.23535, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 214, "label": "text", "bbox": { "l": 489.18735, "t": 389.20004, "r": 492.34668, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.18735, "r_y0": 395.51868, "r_x1": 492.34668, "r_y1": 395.51868, "r_x2": 492.34668, "r_y2": 389.20004, "r_x3": 489.18735, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 215, "label": "text", "bbox": { "l": 502.13933999999995, "t": 389.20004, "r": 505.29868000000005, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.13933999999995, "r_y0": 395.51868, "r_x1": 505.29868000000005, "r_y1": 395.51868, "r_x2": 505.29868000000005, "r_y2": 389.20004, "r_x3": 502.13933999999995, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 216, "label": "text", "bbox": { "l": 515.09131, "t": 389.20004, "r": 521.41064, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09131, "r_y0": 395.51868, "r_x1": 521.41064, "r_y1": 395.51868, "r_x2": 521.41064, "r_y2": 389.20004, "r_x3": 515.09131, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 217, "label": "text", "bbox": { "l": 528.04364, "t": 389.20004, "r": 534.13104, "b": 395.51868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04364, "r_y0": 395.51868, "r_x1": 534.13104, "r_y1": 395.51868, "r_x2": 534.13104, "r_y2": 389.20004, "r_x3": 528.04364, "r_y3": 389.20004, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 218, "label": "text", "bbox": { "l": 385.2814, "t": 398.97464, "r": 391.60071, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.2814, "r_y0": 405.29327, "r_x1": 391.60071, "r_y1": 405.29327, "r_x2": 391.60071, "r_y2": 398.97464, "r_x3": 385.2814, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 219, "label": "text", "bbox": { "l": 398.52341, "t": 398.97464, "r": 404.84271, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52341, "r_y0": 405.29327, "r_x1": 404.84271, "r_y1": 405.29327, "r_x2": 404.84271, "r_y2": 398.97464, "r_x3": 398.52341, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 220, "label": "text", "bbox": { "l": 411.47604, "t": 398.97464, "r": 417.79535, "b": 405.29327, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.47604, "r_y0": 405.29327, "r_x1": 417.79535, "r_y1": 405.29327, "r_x2": 417.79535, "r_y2": 398.97464, "r_x3": 411.47604, "r_y3": 398.97464, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 221, "label": "text", "bbox": { "l": 424.42719, "t": 406.77463000000006, "r": 430.74648999999994, "b": 413.09326, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.42719, "r_y0": 413.09326, "r_x1": 430.74648999999994, "r_y1": 413.09326, "r_x2": 430.74648999999994, "r_y2": 406.77463000000006, "r_x3": 424.42719, "r_y3": 406.77463000000006, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 222, "label": "text", "bbox": { "l": 502.86941999999993, "t": 410.99438, "r": 509.18871999999993, "b": 417.31302, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.86941999999993, "r_y0": 417.31302, "r_x1": 509.18871999999993, "r_y1": 417.31302, "r_x2": 509.18871999999993, "r_y2": 410.99438, "r_x3": 502.86941999999993, "r_y3": 410.99438, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 223, "label": "text", "bbox": { "l": 384.35437, "t": 381.77722, "r": 430.99261, "b": 386.44281, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35437, "r_y0": 386.44281, "r_x1": 430.99261, "r_y1": 386.44281, "r_x2": 430.99261, "r_y2": 381.77722, "r_x3": 384.35437, "r_y3": 381.77722, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 62.595001, "t": 458.72836, "r": 532.63049, "b": 467.63492, "coord_origin": "TOPLEFT" }, "confidence": 0.9153602719306946, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.595001, "r_y0": 467.63492, "r_x1": 532.63049, "r_y1": 467.63492, "r_x2": 532.63049, "r_y2": 458.72836, "r_x3": 62.595001, "r_y3": 458.72836, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 50.112, "t": 491.39536, "r": 163.7558, "b": 501.24741, "coord_origin": "TOPLEFT" }, "confidence": 0.9561247229576111, "cells": [ { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 501.24741, "r_x1": 64.448898, "r_y1": 501.24741, "r_x2": 64.448898, "r_y2": 491.39536, "r_x3": 50.112, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.006828, "r_y0": 501.24741, "r_x1": 163.7558, "r_y1": 501.24741, "r_x2": 163.7558, "r_y2": 491.39536, "r_x3": 74.006828, "r_y3": 491.39536, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.5. Qualitative Analysis" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 536.87337, "r": 286.36511, "b": 713.1519470000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9852361679077148, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 545.77992, "r_x1": 286.36499, "r_y1": 545.77992, "r_x2": 286.36499, "r_y2": 536.87337, "r_x3": 62.067001, "r_y3": 536.87337, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 557.73492, "r_x1": 211.15741, "r_y1": 557.73492, "r_x2": 211.15741, "r_y2": 548.82837, "r_x3": 50.112, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.10000999999997, "r_y0": 557.50578, "r_x1": 259.17453, "r_y1": 557.50578, "r_x2": 259.17453, "r_y2": 548.91803, "r_x3": 215.10000999999997, "r_y3": 548.91803, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73492, "r_x1": 286.36273, "r_y1": 557.73492, "r_x2": 286.36273, "r_y2": 548.82837, "r_x3": 263.12, "r_y3": 548.82837, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 569.68993, "r_x1": 286.36505, "r_y1": 569.68993, "r_x2": 286.36505, "r_y2": 560.78337, "r_x3": 50.112, "r_y3": 560.78337, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 581.6449299999999, "r_x1": 286.36508, "r_y1": 581.6449299999999, "r_x2": 286.36508, "r_y2": 572.73837, "r_x3": 50.112, "r_y3": 572.73837, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 593.59993, "r_x1": 286.36508, "r_y1": 593.59993, "r_x2": 286.36508, "r_y2": 584.69337, "r_x3": 50.112, "r_y3": 584.69337, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 605.55592, "r_x1": 286.36505, "r_y1": 605.55592, "r_x2": 286.36505, "r_y2": 596.64937, "r_x3": 50.112, "r_y3": 596.64937, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 617.51093, "r_x1": 286.36508, "r_y1": 617.51093, "r_x2": 286.36508, "r_y2": 608.60437, "r_x3": 50.112, "r_y3": 608.60437, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 629.46593, "r_x1": 286.36508, "r_y1": 629.46593, "r_x2": 286.36508, "r_y2": 620.55937, "r_x3": 50.112, "r_y3": 620.55937, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 641.42093, "r_x1": 286.36508, "r_y1": 641.42093, "r_x2": 286.36508, "r_y2": 632.51437, "r_x3": 50.112, "r_y3": 632.51437, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 653.37593, "r_x1": 286.36508, "r_y1": 653.37593, "r_x2": 286.36508, "r_y2": 644.46938, "r_x3": 50.112, "r_y3": 644.46938, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 665.33094, "r_x1": 286.36511, "r_y1": 665.33094, "r_x2": 286.36511, "r_y2": 656.42438, "r_x3": 50.112, "r_y3": 656.42438, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 677.28694, "r_x1": 286.36508, "r_y1": 677.28694, "r_x2": 286.36508, "r_y2": 668.38037, "r_x3": 50.112, "r_y3": 668.38037, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 689.24194, "r_x1": 286.36511, "r_y1": 689.24194, "r_x2": 286.36511, "r_y2": 680.33537, "r_x3": 50.112, "r_y3": 680.33537, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 701.196945, "r_x1": 286.36511, "r_y1": 701.196945, "r_x2": 286.36511, "r_y2": 692.290375, "r_x3": 50.112, "r_y3": 692.290375, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.1519470000001, "r_x1": 226.88833999999997, "r_y1": 713.1519470000001, "r_x2": 226.88833999999997, "r_y2": 704.245377, "r_x3": 50.112, "r_y3": 704.245377, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type." }, { "label": "section_header", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 308.862, "t": 490.70892, "r": 460.84848, "b": 501.45663, "coord_origin": "TOPLEFT" }, "confidence": 0.9436525702476501, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 501.45663, "r_x1": 316.07382, "r_y1": 501.45663, "r_x2": 316.07382, "r_y2": 490.70892, "r_x3": 308.862, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.68954, "r_y0": 501.45663, "r_x1": 460.84848, "r_y1": 501.45663, "r_x2": 460.84848, "r_y2": 490.70892, "r_x3": 325.68954, "r_y3": 490.70892, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Future Work & Conclusion" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.862, "t": 512.89337, "r": 545.11517, "b": 653.30592, "coord_origin": "TOPLEFT" }, "confidence": 0.9875594973564148, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 521.79993, "r_x1": 545.11505, "r_y1": 521.79993, "r_x2": 545.11505, "r_y2": 512.89337, "r_x3": 320.81699, "r_y3": 512.89337, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 533.75491, "r_x1": 545.11517, "r_y1": 533.75491, "r_x2": 545.11517, "r_y2": 524.84836, "r_x3": 308.862, "r_y3": 524.84836, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.70992, "r_x1": 545.11511, "r_y1": 545.70992, "r_x2": 545.11511, "r_y2": 536.80336, "r_x3": 308.862, "r_y3": 536.80336, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 557.6649199999999, "r_x1": 545.11505, "r_y1": 557.6649199999999, "r_x2": 545.11505, "r_y2": 548.75836, "r_x3": 308.862, "r_y3": 548.75836, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.61992, "r_x1": 545.11517, "r_y1": 569.61992, "r_x2": 545.11517, "r_y2": 560.71336, "r_x3": 308.862, "r_y3": 560.71336, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 581.57492, "r_x1": 545.11511, "r_y1": 581.57492, "r_x2": 545.11511, "r_y2": 572.66837, "r_x3": 308.862, "r_y3": 572.66837, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 593.53091, "r_x1": 545.11511, "r_y1": 593.53091, "r_x2": 545.11511, "r_y2": 584.62436, "r_x3": 308.862, "r_y3": 584.62436, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 605.48592, "r_x1": 400.46808, "r_y1": 605.48592, "r_x2": 400.46808, "r_y2": 596.57936, "r_x3": 308.862, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.37839, "r_y0": 605.48592, "r_x1": 545.11511, "r_y1": 605.48592, "r_x2": 545.11511, "r_y2": 596.57936, "r_x3": 408.37839, "r_y3": 596.57936, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 617.44092, "r_x1": 545.11505, "r_y1": 617.44092, "r_x2": 545.11505, "r_y2": 608.53436, "r_x3": 308.862, "r_y3": 608.53436, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 629.3959199999999, "r_x1": 545.11511, "r_y1": 629.3959199999999, "r_x2": 545.11511, "r_y2": 620.48936, "r_x3": 308.862, "r_y3": 620.48936, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 641.35092, "r_x1": 545.11505, "r_y1": 641.35092, "r_x2": 545.11505, "r_y2": 632.4443699999999, "r_x3": 308.862, "r_y3": 632.4443699999999, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 653.30592, "r_x1": 365.85803, "r_y1": 653.30592, "r_x2": 365.85803, "r_y2": 644.39937, "r_x3": 308.862, "r_y3": 644.39937, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 308.862, "t": 672.09892, "r": 364.40585, "b": 682.84664, "coord_origin": "TOPLEFT" }, "confidence": 0.9442470073699951, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 682.84664, "r_x1": 364.40585, "r_y1": 682.84664, "r_x2": 364.40585, "r_y2": 672.09892, "r_x3": 308.862, "r_y3": 672.09892, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 10, "page_no": 7, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 313.345, "t": 693.9617920000001, "r": 545.1134, "b": 712.936752, "coord_origin": "TOPLEFT" }, "confidence": 0.8318753838539124, "cells": [ { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.345, "r_y0": 701.977753, "r_x1": 323.80792, "r_y1": 701.977753, "r_x2": 323.80792, "r_y2": 693.9617920000001, "r_x3": 313.345, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05127, "r_y0": 701.977753, "r_x1": 545.10852, "r_y1": 701.977753, "r_x2": 545.10852, "r_y2": 693.9617920000001, "r_x3": 326.05127, "r_y3": 693.9617920000001, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 712.936752, "r_x1": 545.1134, "r_y1": 712.936752, "r_x2": 545.1134, "r_y2": 704.920792, "r_x3": 328.78101, "r_y3": 704.920792, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-" }, { "label": "picture", "id": 15, "page_no": 7, "cluster": { "id": 15, "label": "picture", "bbox": { "l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT" }, "confidence": 0.7699173092842102, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 14, "page_no": 7, "cluster": { "id": 14, "label": "picture", "bbox": { "l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT" }, "confidence": 0.7873926162719727, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_footer", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.121, "t": 734.133366, "r": 300.10229, "b": 743.039928, "coord_origin": "TOPLEFT" }, "confidence": 0.8709858059883118, "cells": [ { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.121, "r_y0": 743.039928, "r_x1": 300.10229, "r_y1": 743.039928, "r_x2": 300.10229, "r_y2": 734.133366, "r_x3": 295.121, "r_y3": 734.133366, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" } ] } }, { "page_no": 8, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.89977999999996, "r_x1": 286.36334, "r_y1": 83.89977999999996, "r_x2": 286.36334, "r_y2": 75.88378999999998, "r_x3": 70.030998, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 94.85875999999996, "r_x1": 286.36331, "r_y1": 94.85875999999996, "r_x2": 286.36331, "r_y2": 86.84276999999997, "r_x3": 70.030998, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 105.81677000000002, "r_x1": 85.722198, "r_y1": 105.81677000000002, "r_x2": 85.722198, "r_y2": 97.80078000000003, "r_x3": 70.030998, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.889, "r_y0": 105.61053000000004, "r_x1": 199.93315, "r_y1": 105.61053000000004, "r_x2": 199.93315, "r_y2": 97.88147000000004, "r_x3": 87.889, "r_y3": 97.88147000000004, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.936, "r_y0": 105.81677000000002, "r_x1": 286.36313, "r_y1": 105.81677000000002, "r_x2": 286.36313, "r_y2": 97.80078000000003, "r_x3": 199.936, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 116.77575999999999, "r_x1": 221.94871999999998, "r_y1": 116.77575999999999, "r_x2": 221.94871999999998, "r_y2": 108.75977, "r_x3": 70.031006, "r_y3": 108.75977, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595005, "r_y0": 128.04773, "r_x1": 65.206657, "r_y1": 128.04773, "r_x2": 65.206657, "r_y2": 120.03174000000013, "r_x3": 54.595005, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.481873, "r_y0": 128.04773, "r_x1": 286.35852, "r_y1": 128.04773, "r_x2": 286.35852, "r_y2": 120.03174000000013, "r_x3": 67.481873, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.00671, "r_x1": 179.67215, "r_y1": 139.00671, "r_x2": 179.67215, "r_y2": 130.99072, "r_x3": 70.031006, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58101, "r_y0": 139.00671, "r_x1": 286.36334, "r_y1": 139.00671, "r_x2": 286.36334, "r_y2": 130.99072, "r_x3": 185.58101, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.96569999999997, "r_x1": 113.11456, "r_y1": 149.96569999999997, "r_x2": 113.11456, "r_y2": 141.94970999999998, "r_x3": 70.031006, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34200999999999, "r_y0": 149.75946, "r_x1": 235.3082, "r_y1": 149.75946, "r_x2": 235.3082, "r_y2": 142.0304, "r_x3": 116.34200999999999, "r_y3": 142.0304, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.30701, "r_y0": 149.96569999999997, "r_x1": 267.67572, "r_y1": 149.96569999999997, "r_x2": 267.67572, "r_y2": 141.94970999999998, "r_x3": 235.30701, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 161.23766999999998, "r_x1": 65.103195, "r_y1": 161.23766999999998, "r_x2": 65.103195, "r_y2": 153.22168, "r_x3": 54.595001, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.356239, "r_y0": 161.23766999999998, "r_x1": 218.77876, "r_y1": 161.23766999999998, "r_x2": 218.77876, "r_y2": 153.22168, "r_x3": 67.356239, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.97999999999996, "r_y0": 161.03143, "r_x1": 286.36301, "r_y1": 161.03143, "r_x2": 286.36301, "r_y2": 153.30237, "r_x3": 220.97999999999996, "r_y3": 153.30237, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 171.99041999999997, "r_x1": 125.26401000000001, "r_y1": 171.99041999999997, "r_x2": 125.26401000000001, "r_y2": 164.26135, "r_x3": 70.030991, "r_y3": 164.26135, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26098999999999, "r_y0": 172.19665999999995, "r_x1": 286.36029, "r_y1": 172.19665999999995, "r_x2": 286.36029, "r_y2": 164.18066, "r_x3": 125.26098999999999, "r_y3": 164.18066, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 183.15466000000004, "r_x1": 97.916496, "r_y1": 183.15466000000004, "r_x2": 97.916496, "r_y2": 175.13867000000005, "r_x3": 70.030991, "r_y3": 175.13867000000005, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 194.42664000000002, "r_x1": 65.806984, "r_y1": 194.42664000000002, "r_x2": 65.806984, "r_y2": 186.41063999999994, "r_x3": 54.59499, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.210922, "r_y0": 194.42664000000002, "r_x1": 286.36401, "r_y1": 194.42664000000002, "r_x2": 286.36401, "r_y2": 186.41063999999994, "r_x3": 68.210922, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 205.38562000000002, "r_x1": 286.36331, "r_y1": 205.38562000000002, "r_x2": 286.36331, "r_y2": 197.36963000000003, "r_x3": 70.030983, "r_y3": 197.36963000000003, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 216.3446, "r_x1": 286.36334, "r_y1": 216.3446, "r_x2": 286.36334, "r_y2": 208.32861000000003, "r_x3": 70.030983, "r_y3": 208.32861000000003, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 227.30358999999999, "r_x1": 245.83519, "r_y1": 227.30358999999999, "r_x2": 245.83519, "r_y2": 219.2876, "r_x3": 70.030983, "r_y3": 219.2876, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594982, "r_y0": 238.57556, "r_x1": 65.381134, "r_y1": 238.57556, "r_x2": 65.381134, "r_y2": 230.55957, "r_x3": 54.594982, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693779, "r_y0": 238.57556, "r_x1": 286.35849, "r_y1": 238.57556, "r_x2": 286.35849, "r_y2": 230.55957, "r_x3": 67.693779, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 249.53454999999997, "r_x1": 286.36334, "r_y1": 249.53454999999997, "r_x2": 286.36334, "r_y2": 241.51855, "r_x3": 70.030983, "r_y3": 241.51855, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 260.49255000000005, "r_x1": 108.39821, "r_y1": 260.49255000000005, "r_x2": 108.39821, "r_y2": 252.47655999999995, "r_x3": 70.030983, "r_y3": 252.47655999999995, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64498000000002, "r_y0": 260.28632000000005, "r_x1": 286.3595, "r_y1": 260.28632000000005, "r_x2": 286.3595, "r_y2": 252.55724999999995, "r_x3": 110.64498000000002, "r_y3": 252.55724999999995, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 271.24530000000004, "r_x1": 140.57861, "r_y1": 271.24530000000004, "r_x2": 140.57861, "r_y2": 263.51624000000004, "r_x3": 70.030983, "r_y3": 263.51624000000004, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.57797, "r_y0": 271.45154, "r_x1": 266.47522, "r_y1": 271.45154, "r_x2": 266.47522, "r_y2": 263.43555000000003, "r_x3": 140.57797, "r_y3": 263.43555000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594971, "r_y0": 282.72351, "r_x1": 64.848648, "r_y1": 282.72351, "r_x2": 64.848648, "r_y2": 274.70758, "r_x3": 54.594971, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.047119, "r_y0": 282.72351, "r_x1": 286.36676, "r_y1": 282.72351, "r_x2": 286.36676, "r_y2": 274.70758, "r_x3": 67.047119, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 293.68253, "r_x1": 179.57349, "r_y1": 293.68253, "r_x2": 179.57349, "r_y2": 285.66655999999995, "r_x3": 70.030975, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.01559, "r_y0": 293.68253, "r_x1": 194.4846, "r_y1": 293.68253, "r_x2": 194.4846, "r_y2": 285.66655999999995, "r_x3": 187.01559, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04398, "r_y0": 293.47632, "r_x1": 286.36304, "r_y1": 293.47632, "r_x2": 286.36304, "r_y2": 285.74725, "r_x3": 198.04398, "r_y3": 285.74725, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 304.43530000000004, "r_x1": 260.19937, "r_y1": 304.43530000000004, "r_x2": 260.19937, "r_y2": 296.70624, "r_x3": 70.030975, "r_y3": 296.70624, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.198, "r_y0": 304.64151, "r_x1": 286.36197, "r_y1": 304.64151, "r_x2": 286.36197, "r_y2": 296.62555, "r_x3": 260.198, "r_y3": 296.62555, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 315.6004899999999, "r_x1": 142.74849, "r_y1": 315.6004899999999, "r_x2": 142.74849, "r_y2": 307.5845299999999, "r_x3": 70.030991, "r_y3": 307.5845299999999, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 326.8725, "r_x1": 65.61586, "r_y1": 326.8725, "r_x2": 65.61586, "r_y2": 318.85654, "r_x3": 54.59499, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.978821, "r_y0": 326.8725, "r_x1": 199.492, "r_y1": 326.8725, "r_x2": 199.492, "r_y2": 318.85654, "r_x3": 67.978821, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.98792, "r_y0": 326.8725, "r_x1": 286.35849, "r_y1": 326.8725, "r_x2": 286.35849, "r_y2": 318.85654, "r_x3": 206.98792, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 337.83051, "r_x1": 176.28284, "r_y1": 337.83051, "r_x2": 176.28284, "r_y2": 329.8145400000001, "r_x3": 70.030991, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.60416, "r_y0": 337.83051, "r_x1": 190.07317, "r_y1": 337.83051, "r_x2": 190.07317, "r_y2": 329.8145400000001, "r_x3": 182.60416, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28299, "r_y0": 337.62429999999995, "r_x1": 286.36319, "r_y1": 337.62429999999995, "r_x2": 286.36319, "r_y2": 329.89522999999997, "r_x3": 193.28299, "r_y3": 329.89522999999997, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 348.58331, "r_x1": 206.34717, "r_y1": 348.58331, "r_x2": 206.34717, "r_y2": 340.85425, "r_x3": 70.030991, "r_y3": 340.85425, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.34599, "r_y0": 348.78952, "r_x1": 274.82239, "r_y1": 348.78952, "r_x2": 274.82239, "r_y2": 340.77356, "r_x3": 206.34599, "r_y3": 340.77356, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594986000000006, "r_y0": 360.06152, "r_x1": 65.04657, "r_y1": 360.06152, "r_x2": 65.04657, "r_y2": 352.0455600000001, "r_x3": 54.594986000000006, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.287483, "r_y0": 360.06152, "r_x1": 286.35849, "r_y1": 360.06152, "r_x2": 286.35849, "r_y2": 352.0455600000001, "r_x3": 67.287483, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 371.02054, "r_x1": 234.12507999999997, "r_y1": 371.02054, "r_x2": 234.12507999999997, "r_y2": 363.00458, "r_x3": 70.030983, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05186, "r_y0": 371.02054, "r_x1": 286.36331, "r_y1": 371.02054, "r_x2": 286.36331, "r_y2": 363.00458, "r_x3": 240.05186, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 381.97952, "r_x1": 286.36331, "r_y1": 381.97952, "r_x2": 286.36331, "r_y2": 373.96356, "r_x3": 70.030983, "r_y3": 373.96356, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 392.93851, "r_x1": 286.36331, "r_y1": 392.93851, "r_x2": 286.36331, "r_y2": 384.92255, "r_x3": 70.030983, "r_y3": 384.92255, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 403.89749, "r_x1": 114.57605, "r_y1": 403.89749, "r_x2": 114.57605, "r_y2": 395.88153, "r_x3": 70.030983, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.80399000000001, "r_y0": 403.69128, "r_x1": 186.7287, "r_y1": 403.69128, "r_x2": 186.7287, "r_y2": 395.96222, "r_x3": 117.80399000000001, "r_y3": 395.96222, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.728, "r_y0": 403.89749, "r_x1": 243.00113999999996, "r_y1": 403.89749, "r_x2": 243.00113999999996, "r_y2": 395.88153, "r_x3": 186.728, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 415.1684900000001, "r_x1": 65.334427, "r_y1": 415.1684900000001, "r_x2": 65.334427, "r_y2": 407.15253000000007, "r_x3": 54.595001, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.637054, "r_y0": 415.1684900000001, "r_x1": 286.35852, "r_y1": 415.1684900000001, "r_x2": 286.35852, "r_y2": 407.15253000000007, "r_x3": 67.637054, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 426.12747, "r_x1": 147.13306, "r_y1": 426.12747, "r_x2": 147.13306, "r_y2": 418.11151, "r_x3": 70.030998, "r_y3": 418.11151, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15601, "r_y0": 425.92126, "r_x1": 286.35989, "r_y1": 425.92126, "r_x2": 286.35989, "r_y2": 418.1922, "r_x3": 149.15601, "r_y3": 418.1922, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.88025, "r_x1": 213.48445, "r_y1": 436.88025, "r_x2": 213.48445, "r_y2": 429.15118, "r_x3": 70.031006, "r_y3": 429.15118, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.483, "r_y0": 437.08646000000005, "r_x1": 261.04083, "r_y1": 437.08646000000005, "r_x2": 261.04083, "r_y2": 429.07050000000004, "r_x3": 213.483, "r_y3": 429.07050000000004, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 448.3584599999999, "r_x1": 65.399307, "r_y1": 448.3584599999999, "r_x2": 65.399307, "r_y2": 440.3424999999999, "r_x3": 50.112, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693321, "r_y0": 448.3584599999999, "r_x1": 286.3587, "r_y1": 448.3584599999999, "r_x2": 286.3587, "r_y2": 440.3424999999999, "r_x3": 67.693321, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 459.31747, "r_x1": 202.74268, "r_y1": 459.31747, "r_x2": 202.74268, "r_y2": 451.30151, "r_x3": 70.030998, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.00122, "r_y0": 459.31747, "r_x1": 286.36331, "r_y1": 459.31747, "r_x2": 286.36331, "r_y2": 451.30151, "r_x3": 209.00122, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 470.27646, "r_x1": 286.36334, "r_y1": 470.27646, "r_x2": 286.36334, "r_y2": 462.2605, "r_x3": 70.030998, "r_y3": 462.2605, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 481.23544, "r_x1": 141.86981, "r_y1": 481.23544, "r_x2": 141.86981, "r_y2": 473.21948, "r_x3": 70.030998, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.097, "r_y0": 481.02924, "r_x1": 166.01561, "r_y1": 481.02924, "r_x2": 166.01561, "r_y2": 473.30017, "r_x3": 145.097, "r_y3": 473.30017, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.015, "r_y0": 481.23544, "r_x1": 259.90216, "r_y1": 481.23544, "r_x2": 259.90216, "r_y2": 473.21948, "r_x3": 166.015, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.50644, "r_x1": 66.033806, "r_y1": 492.50644, "r_x2": 66.033806, "r_y2": 484.49048, "r_x3": 50.112, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.423035, "r_y0": 492.50644, "r_x1": 286.35873, "r_y1": 492.50644, "r_x2": 286.35873, "r_y2": 484.49048, "r_x3": 68.423035, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 503.46542, "r_x1": 286.36331, "r_y1": 503.46542, "r_x2": 286.36331, "r_y2": 495.44946, "r_x3": 70.030998, "r_y3": 495.44946, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 514.2182, "r_x1": 227.40926, "r_y1": 514.2182, "r_x2": 227.40926, "r_y2": 506.48914, "r_x3": 70.030998, "r_y3": 506.48914, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.40500000000003, "r_y0": 514.4244100000001, "r_x1": 286.35913, "r_y1": 514.4244100000001, "r_x2": 286.35913, "r_y2": 506.40845, "r_x3": 227.40500000000003, "r_y3": 506.40845, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 525.38339, "r_x1": 286.36328, "r_y1": 525.38339, "r_x2": 286.36328, "r_y2": 517.36743, "r_x3": 70.031006, "r_y3": 517.36743, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 536.34238, "r_x1": 112.36138000000001, "r_y1": 536.34238, "r_x2": 112.36138000000001, "r_y2": 528.32642, "r_x3": 70.031006, "r_y3": 528.32642, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 547.61438, "r_x1": 65.466705, "r_y1": 547.61438, "r_x2": 65.466705, "r_y2": 539.59842, "r_x3": 50.112007, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.770828, "r_y0": 547.61438, "r_x1": 286.35873, "r_y1": 547.61438, "r_x2": 286.35873, "r_y2": 539.59842, "r_x3": 67.770828, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 558.57338, "r_x1": 136.28374, "r_y1": 558.57338, "r_x2": 136.28374, "r_y2": 550.55742, "r_x3": 70.031006, "r_y3": 550.55742, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.811, "r_y0": 558.36716, "r_x1": 286.36206, "r_y1": 558.36716, "r_x2": 286.36206, "r_y2": 550.63812, "r_x3": 138.811, "r_y3": 550.63812, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 569.32616, "r_x1": 286.36334, "r_y1": 569.32616, "r_x2": 286.36334, "r_y2": 561.5971199999999, "r_x3": 70.031006, "r_y3": 561.5971199999999, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 580.28516, "r_x1": 74.514206, "r_y1": 580.28516, "r_x2": 74.514206, "r_y2": 572.55612, "r_x3": 70.031006, "r_y3": 572.55612, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.514008, "r_y0": 580.4913799999999, "r_x1": 286.36313, "r_y1": 580.4913799999999, "r_x2": 286.36313, "r_y2": 572.47542, "r_x3": 74.514008, "r_y3": 572.47542, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 591.44937, "r_x1": 90.357834, "r_y1": 591.44937, "r_x2": 90.357834, "r_y2": 583.4334100000001, "r_x3": 70.031006, "r_y3": 583.4334100000001, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 602.72137, "r_x1": 66.270439, "r_y1": 602.72137, "r_x2": 66.270439, "r_y2": 594.70541, "r_x3": 50.112007, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.695168, "r_y0": 602.72137, "r_x1": 286.35873, "r_y1": 602.72137, "r_x2": 286.35873, "r_y2": 594.70541, "r_x3": 68.695168, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 613.68037, "r_x1": 286.3631, "r_y1": 613.68037, "r_x2": 286.3631, "r_y2": 605.66441, "r_x3": 70.031006, "r_y3": 605.66441, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 624.63937, "r_x1": 286.36331, "r_y1": 624.63937, "r_x2": 286.36331, "r_y2": 616.62341, "r_x3": 70.031006, "r_y3": 616.62341, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 635.5983699999999, "r_x1": 77.500015, "r_y1": 635.5983699999999, "r_x2": 77.500015, "r_y2": 627.58241, "r_x3": 70.031006, "r_y3": 627.58241, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.920006, "r_y0": 635.39215, "r_x1": 286.3624, "r_y1": 635.39215, "r_x2": 286.3624, "r_y2": 627.6631199999999, "r_x3": 79.920006, "r_y3": 627.6631199999999, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 646.35115, "r_x1": 140.67728, "r_y1": 646.35115, "r_x2": 140.67728, "r_y2": 638.62212, "r_x3": 70.031006, "r_y3": 638.62212, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.67599, "r_y0": 646.55737, "r_x1": 264.43921, "r_y1": 646.55737, "r_x2": 264.43921, "r_y2": 638.54141, "r_x3": 140.67599, "r_y3": 638.54141, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 657.82938, "r_x1": 66.534035, "r_y1": 657.82938, "r_x2": 66.534035, "r_y2": 649.81342, "r_x3": 50.111992, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.998329, "r_y0": 657.82938, "r_x1": 286.35873, "r_y1": 657.82938, "r_x2": 286.35873, "r_y2": 649.81342, "r_x3": 68.998329, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 668.78738, "r_x1": 93.200165, "r_y1": 668.78738, "r_x2": 93.200165, "r_y2": 660.77142, "r_x3": 70.030991, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.20243, "r_y0": 668.78738, "r_x1": 286.36334, "r_y1": 668.78738, "r_x2": 286.36334, "r_y2": 660.77142, "r_x3": 102.20243, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 679.74638, "r_x1": 171.9969, "r_y1": 679.74638, "r_x2": 171.9969, "r_y2": 671.73042, "r_x3": 70.030991, "r_y3": 671.73042, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 691.01839, "r_x1": 65.515968, "r_y1": 691.01839, "r_x2": 65.515968, "r_y2": 683.00243, "r_x3": 50.111992, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.827499, "r_y0": 691.01839, "r_x1": 286.3587, "r_y1": 691.01839, "r_x2": 286.3587, "r_y2": 683.00243, "r_x3": 67.827499, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 701.977386, "r_x1": 102.15761, "r_y1": 701.977386, "r_x2": 102.15761, "r_y2": 693.9614260000001, "r_x3": 70.030991, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.54999, "r_y0": 701.771156, "r_x1": 231.47461, "r_y1": 701.771156, "r_x2": 231.47461, "r_y2": 694.0421220000001, "r_x3": 107.54999, "r_y3": 694.0421220000001, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.47598, "r_y0": 701.977386, "r_x1": 286.35931, "r_y1": 701.977386, "r_x2": 286.35931, "r_y2": 693.9614260000001, "r_x3": 231.47598, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 712.936386, "r_x1": 97.916481, "r_y1": 712.936386, "r_x2": 97.916481, "r_y2": 704.920425, "r_x3": 70.030975, "r_y3": 704.920425, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 83.89940999999999, "r_x1": 324.74973, "r_y1": 83.89940999999999, "r_x2": 324.74973, "r_y2": 75.88342000000011, "r_x3": 308.86197, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13382, "r_y0": 83.89940999999999, "r_x1": 545.1087, "r_y1": 83.89940999999999, "r_x2": 545.1087, "r_y2": 75.88342000000011, "r_x3": 327.13382, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 94.85741999999993, "r_x1": 545.1134, "r_y1": 94.85741999999993, "r_x2": 545.1134, "r_y2": 86.84142999999995, "r_x3": 328.78098, "r_y3": 86.84142999999995, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 105.81641000000002, "r_x1": 390.96295, "r_y1": 105.81641000000002, "r_x2": 390.96295, "r_y2": 97.80042000000003, "r_x3": 328.78098, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27008, "r_y0": 105.81641000000002, "r_x1": 435.1404099999999, "r_y1": 105.81641000000002, "r_x2": 435.1404099999999, "r_y2": 97.80042000000003, "r_x3": 400.27008, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71277, "r_y0": 105.81641000000002, "r_x1": 545.11328, "r_y1": 105.81641000000002, "r_x2": 545.11328, "r_y2": 97.80042000000003, "r_x3": 441.71277, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 116.7753899999999, "r_x1": 440.80719, "r_y1": 116.7753899999999, "r_x2": 440.80719, "r_y2": 108.75940000000003, "r_x3": 328.78098, "r_y3": 108.75940000000003, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63498, "r_y0": 116.56914999999992, "r_x1": 545.11304, "r_y1": 116.56914999999992, "r_x2": 545.11304, "r_y2": 108.84009000000003, "r_x3": 446.63498, "r_y3": 108.84009000000003, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 127.52814000000001, "r_x1": 471.13153, "r_y1": 127.52814000000001, "r_x2": 471.13153, "r_y2": 119.79907000000003, "r_x3": 328.78098, "r_y3": 119.79907000000003, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13300000000004, "r_y0": 127.73437999999999, "r_x1": 545.11475, "r_y1": 127.73437999999999, "r_x2": 545.11475, "r_y2": 119.71838000000002, "r_x3": 471.13300000000004, "r_y3": 119.71838000000002, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 138.69335999999998, "r_x1": 356.6665, "r_y1": 138.69335999999998, "r_x2": 356.6665, "r_y2": 130.67737, "r_x3": 328.78101, "r_y3": 130.67737, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 150.13933999999995, "r_x1": 325.24371, "r_y1": 150.13933999999995, "r_x2": 325.24371, "r_y2": 142.12334999999996, "r_x3": 308.862, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.70197, "r_y0": 150.13933999999995, "r_x1": 545.10883, "r_y1": 150.13933999999995, "r_x2": 545.10883, "r_y2": 142.12334999999996, "r_x3": 327.70197, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.09735, "r_x1": 414.44598, "r_y1": 161.09735, "r_x2": 414.44598, "r_y2": 153.08136000000002, "r_x3": 328.78101, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.82532, "r_y0": 161.09735, "r_x1": 545.1134, "r_y1": 161.09735, "r_x2": 545.1134, "r_y2": 153.08136000000002, "r_x3": 421.82532, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 172.05633999999998, "r_x1": 493.62835999999993, "r_y1": 172.05633999999998, "r_x2": 493.62835999999993, "r_y2": 164.04034000000001, "r_x3": 328.78101, "r_y3": 164.04034000000001, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.50232000000005, "r_x1": 324.26599, "r_y1": 183.50232000000005, "r_x2": 324.26599, "r_y2": 175.48632999999995, "r_x3": 308.862, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57751, "r_y0": 183.50232000000005, "r_x1": 545.10876, "r_y1": 183.50232000000005, "r_x2": 545.10876, "r_y2": 175.48632999999995, "r_x3": 326.57751, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 194.46130000000005, "r_x1": 545.11334, "r_y1": 194.46130000000005, "r_x2": 545.11334, "r_y2": 186.44530999999995, "r_x3": 328.78101, "r_y3": 186.44530999999995, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 205.42029000000002, "r_x1": 545.11346, "r_y1": 205.42029000000002, "r_x2": 545.11346, "r_y2": 197.40430000000003, "r_x3": 328.78101, "r_y3": 197.40430000000003, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 216.37927000000002, "r_x1": 545.11353, "r_y1": 216.37927000000002, "r_x2": 545.11353, "r_y2": 208.36328000000003, "r_x3": 328.78101, "r_y3": 208.36328000000003, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 227.33826, "r_x1": 479.26413, "r_y1": 227.33826, "r_x2": 479.26413, "r_y2": 219.32227, "r_x3": 328.78101, "r_y3": 219.32227, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 227.13202, "r_x1": 545.11273, "r_y1": 227.13202, "r_x2": 545.11273, "r_y2": 219.40295000000003, "r_x3": 483.11902, "r_y3": 219.40295000000003, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 238.09002999999996, "r_x1": 519.39771, "r_y1": 238.09002999999996, "r_x2": 519.39771, "r_y2": 230.36095999999998, "r_x3": 328.78101, "r_y3": 230.36095999999998, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.401, "r_y0": 238.29625999999996, "r_x1": 545.10767, "r_y1": 238.29625999999996, "r_x2": 545.10767, "r_y2": 230.28026999999997, "r_x3": 519.401, "r_y3": 230.28026999999997, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 249.25525000000005, "r_x1": 545.11328, "r_y1": 249.25525000000005, "r_x2": 545.11328, "r_y2": 241.23925999999994, "r_x3": 328.78101, "r_y3": 241.23925999999994, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 260.21423000000004, "r_x1": 333.26422, "r_y1": 260.21423000000004, "r_x2": 333.26422, "r_y2": 252.19824000000006, "r_x3": 328.78101, "r_y3": 252.19824000000006, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 271.66022, "r_x1": 324.26477, "r_y1": 271.66022, "r_x2": 324.26477, "r_y2": 263.64423, "r_x3": 308.862, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57611, "r_y0": 271.66022, "r_x1": 545.10883, "r_y1": 271.66022, "r_x2": 545.10883, "r_y2": 263.64423, "r_x3": 326.57611, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 282.61917000000005, "r_x1": 545.1134, "r_y1": 282.61917000000005, "r_x2": 545.1134, "r_y2": 274.60321, "r_x3": 328.78101, "r_y3": 274.60321, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 293.57816, "r_x1": 545.11328, "r_y1": 293.57816, "r_x2": 545.11328, "r_y2": 285.56219, "r_x3": 328.78101, "r_y3": 285.56219, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 304.53714, "r_x1": 545.11334, "r_y1": 304.53714, "r_x2": 545.11334, "r_y2": 296.52118, "r_x3": 328.78101, "r_y3": 296.52118, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 315.49515, "r_x1": 352.84683, "r_y1": 315.49515, "r_x2": 352.84683, "r_y2": 307.47919, "r_x3": 328.78101, "r_y3": 307.47919, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.23599, "r_y0": 315.28894, "r_x1": 545.1142, "r_y1": 315.28894, "r_x2": 545.1142, "r_y2": 307.55988, "r_x3": 360.23599, "r_y3": 307.55988, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 326.24792, "r_x1": 371.02173, "r_y1": 326.24792, "r_x2": 371.02173, "r_y2": 318.51886, "r_x3": 328.78101, "r_y3": 318.51886, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.021, "r_y0": 326.45413, "r_x1": 502.26227, "r_y1": 326.45413, "r_x2": 502.26227, "r_y2": 318.43817, "r_x3": 371.021, "r_y3": 318.43817, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.90015, "r_x1": 323.82672, "r_y1": 337.90015, "r_x2": 323.82672, "r_y2": 329.88419, "r_x3": 308.862, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07233, "r_y0": 337.90015, "r_x1": 545.10876, "r_y1": 337.90015, "r_x2": 545.10876, "r_y2": 329.88419, "r_x3": 326.07233, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 348.85916, "r_x1": 545.11346, "r_y1": 348.85916, "r_x2": 545.11346, "r_y2": 340.8432, "r_x3": 328.78101, "r_y3": 340.8432, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 359.81815000000006, "r_x1": 382.7767, "r_y1": 359.81815000000006, "r_x2": 382.7767, "r_y2": 351.80219000000005, "r_x3": 328.78101, "r_y3": 351.80219000000005, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54102, "r_y0": 359.61194, "r_x1": 545.11609, "r_y1": 359.61194, "r_x2": 545.11609, "r_y2": 351.88287, "r_x3": 385.54102, "r_y3": 351.88287, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 370.57092, "r_x1": 443.59579, "r_y1": 370.57092, "r_x2": 443.59579, "r_y2": 362.84186, "r_x3": 328.78101, "r_y3": 362.84186, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59399, "r_y0": 370.77713, "r_x1": 534.48645, "r_y1": 370.77713, "r_x2": 534.48645, "r_y2": 362.76117, "r_x3": 443.59399, "r_y3": 362.76117, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 382.22214, "r_x1": 324.60281, "r_y1": 382.22214, "r_x2": 324.60281, "r_y2": 374.20618, "r_x3": 308.862, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96487, "r_y0": 382.22214, "r_x1": 362.6604, "r_y1": 382.22214, "r_x2": 362.6604, "r_y2": 374.20618, "r_x3": 326.96487, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69479, "r_y0": 382.22214, "r_x1": 389.6134, "r_y1": 382.22214, "r_x2": 389.6134, "r_y2": 374.20618, "r_x3": 368.69479, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.6478, "r_y0": 382.22214, "r_x1": 424.56445, "r_y1": 382.22214, "r_x2": 424.56445, "r_y2": 374.20618, "r_x3": 395.6478, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.5492899999999, "r_y0": 382.22214, "r_x1": 438.0230399999999, "r_y1": 382.22214, "r_x2": 438.0230399999999, "r_y2": 374.20618, "r_x3": 431.5492899999999, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.05743, "r_y0": 382.22214, "r_x1": 488.5038799999999, "r_y1": 382.22214, "r_x2": 488.5038799999999, "r_y2": 374.20618, "r_x3": 444.05743, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.47974, "r_y0": 382.22214, "r_x1": 515.41205, "r_y1": 382.22214, "r_x2": 515.41205, "r_y2": 374.20618, "r_x3": 495.47974, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.44641, "r_y0": 382.22214, "r_x1": 545.10876, "r_y1": 382.22214, "r_x2": 545.10876, "r_y2": 374.20618, "r_x3": 521.44641, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 393.18112, "r_x1": 545.1134, "r_y1": 393.18112, "r_x2": 545.1134, "r_y2": 385.16516, "r_x3": 328.78101, "r_y3": 385.16516, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 404.14011, "r_x1": 545.11346, "r_y1": 404.14011, "r_x2": 545.11346, "r_y2": 396.12415, "r_x3": 328.78101, "r_y3": 396.12415, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 415.09909, "r_x1": 478.00881999999996, "r_y1": 415.09909, "r_x2": 478.00881999999996, "r_y2": 407.08313, "r_x3": 328.78101, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.0701, "r_y0": 415.09909, "r_x1": 491.53912, "r_y1": 415.09909, "r_x2": 491.53912, "r_y2": 407.08313, "r_x3": 484.0701, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.668, "r_y0": 414.89288, "r_x1": 545.11298, "r_y1": 414.89288, "r_x2": 545.11298, "r_y2": 407.16382, "r_x3": 494.668, "r_y3": 407.16382, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 425.85187, "r_x1": 545.11334, "r_y1": 425.85187, "r_x2": 545.11334, "r_y2": 418.12280000000004, "r_x3": 328.78101, "r_y3": 418.12280000000004, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 436.8108500000001, "r_x1": 360.83591, "r_y1": 436.8108500000001, "r_x2": 360.83591, "r_y2": 429.08179, "r_x3": 328.78101, "r_y3": 429.08179, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.836, "r_y0": 437.01706, "r_x1": 475.63287, "r_y1": 437.01706, "r_x2": 475.63287, "r_y2": 429.0011, "r_x3": 360.836, "r_y3": 429.0011, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.46207, "r_x1": 324.57407, "r_y1": 448.46207, "r_x2": 324.57407, "r_y2": 440.44611, "r_x3": 308.862, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93179, "r_y0": 448.46207, "r_x1": 545.1087, "r_y1": 448.46207, "r_x2": 545.1087, "r_y2": 440.44611, "r_x3": 326.93179, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 459.42105, "r_x1": 545.11346, "r_y1": 459.42105, "r_x2": 545.11346, "r_y2": 451.40509, "r_x3": 328.78101, "r_y3": 451.40509, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 470.38004, "r_x1": 545.11328, "r_y1": 470.38004, "r_x2": 545.11328, "r_y2": 462.36407, "r_x3": 328.78101, "r_y3": 462.36407, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 481.33902, "r_x1": 545.11328, "r_y1": 481.33902, "r_x2": 545.11328, "r_y2": 473.32306, "r_x3": 328.78101, "r_y3": 473.32306, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 492.298, "r_x1": 545.11328, "r_y1": 492.298, "r_x2": 545.11328, "r_y2": 484.28204, "r_x3": 328.78101, "r_y3": 484.28204, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 503.25699, "r_x1": 545.1134, "r_y1": 503.25699, "r_x2": 545.1134, "r_y2": 495.24103, "r_x3": 328.78101, "r_y3": 495.24103, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 514.21597, "r_x1": 545.1134, "r_y1": 514.21597, "r_x2": 545.1134, "r_y2": 506.20001, "r_x3": 328.78101, "r_y3": 506.20001, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 525.17496, "r_x1": 545.1098, "r_y1": 525.17496, "r_x2": 545.1098, "r_y2": 517.159, "r_x3": 328.78101, "r_y3": 517.159, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 536.13297, "r_x1": 434.56659, "r_y1": 536.13297, "r_x2": 434.56659, "r_y2": 528.117, "r_x3": 328.78101, "r_y3": 528.117, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86401, "r_y0": 535.9267600000001, "r_x1": 545.11115, "r_y1": 535.9267600000001, "r_x2": 545.11115, "r_y2": 528.19769, "r_x3": 437.86401, "r_y3": 528.19769, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 546.8857399999999, "r_x1": 425.73471, "r_y1": 546.8857399999999, "r_x2": 425.73471, "r_y2": 539.15671, "r_x3": 328.78101, "r_y3": 539.15671, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.73602, "r_y0": 547.09196, "r_x1": 545.11475, "r_y1": 547.09196, "r_x2": 545.11475, "r_y2": 539.076, "r_x3": 425.73602, "r_y3": 539.076, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 558.05096, "r_x1": 399.74109, "r_y1": 558.05096, "r_x2": 399.74109, "r_y2": 550.035, "r_x3": 328.78101, "r_y3": 550.035, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.49696, "r_x1": 324.50351, "r_y1": 569.49696, "r_x2": 324.50351, "r_y2": 561.481, "r_x3": 308.862, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85068, "r_y0": 569.49696, "r_x1": 545.10876, "r_y1": 569.49696, "r_x2": 545.10876, "r_y2": 561.481, "r_x3": 326.85068, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 580.45596, "r_x1": 545.1134, "r_y1": 580.45596, "r_x2": 545.1134, "r_y2": 572.44, "r_x3": 328.78101, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 591.4149600000001, "r_x1": 545.11334, "r_y1": 591.4149600000001, "r_x2": 545.11334, "r_y2": 583.399, "r_x3": 328.78101, "r_y3": 583.399, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 602.37396, "r_x1": 431.61667, "r_y1": 602.37396, "r_x2": 431.61667, "r_y2": 594.358, "r_x3": 328.78101, "r_y3": 594.358, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69101000000006, "r_y0": 602.16774, "r_x1": 545.11224, "r_y1": 602.16774, "r_x2": 545.11224, "r_y2": 594.4387099999999, "r_x3": 434.69101000000006, "r_y3": 594.4387099999999, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 613.12575, "r_x1": 545.1134, "r_y1": 613.12575, "r_x2": 545.1134, "r_y2": 605.39671, "r_x3": 328.78101, "r_y3": 605.39671, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 624.08475, "r_x1": 367.8028, "r_y1": 624.08475, "r_x2": 367.8028, "r_y2": 616.35571, "r_x3": 328.78101, "r_y3": 616.35571, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.802, "r_y0": 624.29097, "r_x1": 458.69446000000005, "r_y1": 624.29097, "r_x2": 458.69446000000005, "r_y2": 616.2750100000001, "r_x3": 367.802, "r_y3": 616.2750100000001, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 635.73697, "r_x1": 324.69476, "r_y1": 635.73697, "r_x2": 324.69476, "r_y2": 627.72101, "r_x3": 308.862, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07065, "r_y0": 635.73697, "r_x1": 545.1087, "r_y1": 635.73697, "r_x2": 545.1087, "r_y2": 627.72101, "r_x3": 327.07065, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 646.69597, "r_x1": 545.11328, "r_y1": 646.69597, "r_x2": 545.11328, "r_y2": 638.68001, "r_x3": 328.78101, "r_y3": 638.68001, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 657.65497, "r_x1": 336.25003, "r_y1": 657.65497, "r_x2": 336.25003, "r_y2": 649.63901, "r_x3": 328.78101, "r_y3": 649.63901, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.10001, "r_y0": 657.44875, "r_x1": 545.11621, "r_y1": 657.44875, "r_x2": 545.11621, "r_y2": 649.71971, "r_x3": 338.10001, "r_y3": 649.71971, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 668.40775, "r_x1": 406.32245, "r_y1": 668.40775, "r_x2": 406.32245, "r_y2": 660.67871, "r_x3": 328.78101, "r_y3": 660.67871, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 668.61398, "r_x1": 521.1189, "r_y1": 668.61398, "r_x2": 521.1189, "r_y2": 660.5980099999999, "r_x3": 406.32202, "r_y3": 660.5980099999999, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 680.05898, "r_x1": 324.71329, "r_y1": 680.05898, "r_x2": 324.71329, "r_y2": 672.04301, "r_x3": 308.86203, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09195, "r_y0": 680.05898, "r_x1": 545.10876, "r_y1": 680.05898, "r_x2": 545.10876, "r_y2": 672.04301, "r_x3": 327.09195, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 691.01797, "r_x1": 482.81488, "r_y1": 691.01797, "r_x2": 482.81488, "r_y2": 683.0020099999999, "r_x3": 328.78104, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75064, "r_y0": 691.01797, "r_x1": 545.1134, "r_y1": 691.01797, "r_x2": 545.1134, "r_y2": 683.0020099999999, "r_x3": 488.75064, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 701.976974, "r_x1": 545.11334, "r_y1": 701.976974, "r_x2": 545.11334, "r_y2": 693.961014, "r_x3": 328.78104, "r_y3": 693.961014, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 712.935974, "r_x1": 379.1543, "r_y1": 712.935974, "r_x2": 379.1543, "r_y2": 704.920013, "r_x3": 328.78104, "r_y3": 704.920013, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.61603, "r_y0": 712.729744, "r_x1": 545.10938, "r_y1": 712.729744, "r_x2": 545.10938, "r_y2": 705.00071, "r_x3": 381.61603, "r_y3": 705.00071, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.0391500000001, "r_x1": 300.10233, "r_y1": 743.0391500000001, "r_x2": 300.10233, "r_y2": 734.1325870000001, "r_x3": 295.12103, "r_y3": 734.1325870000001, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 25, "label": "list_item", "bbox": { "l": 70.030998, "t": 75.88378999999998, "r": 286.36334, "b": 116.77575999999999, "coord_origin": "TOPLEFT" }, "confidence": 0.7310384511947632, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.89977999999996, "r_x1": 286.36334, "r_y1": 83.89977999999996, "r_x2": 286.36334, "r_y2": 75.88378999999998, "r_x3": 70.030998, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 94.85875999999996, "r_x1": 286.36331, "r_y1": 94.85875999999996, "r_x2": 286.36331, "r_y2": 86.84276999999997, "r_x3": 70.030998, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 105.81677000000002, "r_x1": 85.722198, "r_y1": 105.81677000000002, "r_x2": 85.722198, "r_y2": 97.80078000000003, "r_x3": 70.030998, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.889, "r_y0": 105.61053000000004, "r_x1": 199.93315, "r_y1": 105.61053000000004, "r_x2": 199.93315, "r_y2": 97.88147000000004, "r_x3": 87.889, "r_y3": 97.88147000000004, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.936, "r_y0": 105.81677000000002, "r_x1": 286.36313, "r_y1": 105.81677000000002, "r_x2": 286.36313, "r_y2": 97.80078000000003, "r_x3": 199.936, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 116.77575999999999, "r_x1": 221.94871999999998, "r_y1": 116.77575999999999, "r_x2": 221.94871999999998, "r_y2": 108.75977, "r_x3": 70.031006, "r_y3": 108.75977, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 54.595005, "t": 120.03174000000013, "r": 286.36334, "b": 149.96569999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9372755885124207, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595005, "r_y0": 128.04773, "r_x1": 65.206657, "r_y1": 128.04773, "r_x2": 65.206657, "r_y2": 120.03174000000013, "r_x3": 54.595005, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.481873, "r_y0": 128.04773, "r_x1": 286.35852, "r_y1": 128.04773, "r_x2": 286.35852, "r_y2": 120.03174000000013, "r_x3": 67.481873, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.00671, "r_x1": 179.67215, "r_y1": 139.00671, "r_x2": 179.67215, "r_y2": 130.99072, "r_x3": 70.031006, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58101, "r_y0": 139.00671, "r_x1": 286.36334, "r_y1": 139.00671, "r_x2": 286.36334, "r_y2": 130.99072, "r_x3": 185.58101, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.96569999999997, "r_x1": 113.11456, "r_y1": 149.96569999999997, "r_x2": 113.11456, "r_y2": 141.94970999999998, "r_x3": 70.031006, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34200999999999, "r_y0": 149.75946, "r_x1": 235.3082, "r_y1": 149.75946, "r_x2": 235.3082, "r_y2": 142.0304, "r_x3": 116.34200999999999, "r_y3": 142.0304, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.30701, "r_y0": 149.96569999999997, "r_x1": 267.67572, "r_y1": 149.96569999999997, "r_x2": 267.67572, "r_y2": 141.94970999999998, "r_x3": 235.30701, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 54.595001, "t": 153.22168, "r": 286.36301, "b": 183.15466000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9378374218940735, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 161.23766999999998, "r_x1": 65.103195, "r_y1": 161.23766999999998, "r_x2": 65.103195, "r_y2": 153.22168, "r_x3": 54.595001, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.356239, "r_y0": 161.23766999999998, "r_x1": 218.77876, "r_y1": 161.23766999999998, "r_x2": 218.77876, "r_y2": 153.22168, "r_x3": 67.356239, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.97999999999996, "r_y0": 161.03143, "r_x1": 286.36301, "r_y1": 161.03143, "r_x2": 286.36301, "r_y2": 153.30237, "r_x3": 220.97999999999996, "r_y3": 153.30237, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 171.99041999999997, "r_x1": 125.26401000000001, "r_y1": 171.99041999999997, "r_x2": 125.26401000000001, "r_y2": 164.26135, "r_x3": 70.030991, "r_y3": 164.26135, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26098999999999, "r_y0": 172.19665999999995, "r_x1": 286.36029, "r_y1": 172.19665999999995, "r_x2": 286.36029, "r_y2": 164.18066, "r_x3": 125.26098999999999, "r_y3": 164.18066, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 183.15466000000004, "r_x1": 97.916496, "r_y1": 183.15466000000004, "r_x2": 97.916496, "r_y2": 175.13867000000005, "r_x3": 70.030991, "r_y3": 175.13867000000005, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 54.59499, "t": 186.41063999999994, "r": 286.36401, "b": 227.30358999999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9648825526237488, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 194.42664000000002, "r_x1": 65.806984, "r_y1": 194.42664000000002, "r_x2": 65.806984, "r_y2": 186.41063999999994, "r_x3": 54.59499, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.210922, "r_y0": 194.42664000000002, "r_x1": 286.36401, "r_y1": 194.42664000000002, "r_x2": 286.36401, "r_y2": 186.41063999999994, "r_x3": 68.210922, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 205.38562000000002, "r_x1": 286.36331, "r_y1": 205.38562000000002, "r_x2": 286.36331, "r_y2": 197.36963000000003, "r_x3": 70.030983, "r_y3": 197.36963000000003, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 216.3446, "r_x1": 286.36334, "r_y1": 216.3446, "r_x2": 286.36334, "r_y2": 208.32861000000003, "r_x3": 70.030983, "r_y3": 208.32861000000003, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 227.30358999999999, "r_x1": 245.83519, "r_y1": 227.30358999999999, "r_x2": 245.83519, "r_y2": 219.2876, "r_x3": 70.030983, "r_y3": 219.2876, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 54.594982, "t": 230.55957, "r": 286.36334, "b": 271.45154, "coord_origin": "TOPLEFT" }, "confidence": 0.9620943069458008, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594982, "r_y0": 238.57556, "r_x1": 65.381134, "r_y1": 238.57556, "r_x2": 65.381134, "r_y2": 230.55957, "r_x3": 54.594982, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693779, "r_y0": 238.57556, "r_x1": 286.35849, "r_y1": 238.57556, "r_x2": 286.35849, "r_y2": 230.55957, "r_x3": 67.693779, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 249.53454999999997, "r_x1": 286.36334, "r_y1": 249.53454999999997, "r_x2": 286.36334, "r_y2": 241.51855, "r_x3": 70.030983, "r_y3": 241.51855, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 260.49255000000005, "r_x1": 108.39821, "r_y1": 260.49255000000005, "r_x2": 108.39821, "r_y2": 252.47655999999995, "r_x3": 70.030983, "r_y3": 252.47655999999995, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64498000000002, "r_y0": 260.28632000000005, "r_x1": 286.3595, "r_y1": 260.28632000000005, "r_x2": 286.3595, "r_y2": 252.55724999999995, "r_x3": 110.64498000000002, "r_y3": 252.55724999999995, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 271.24530000000004, "r_x1": 140.57861, "r_y1": 271.24530000000004, "r_x2": 140.57861, "r_y2": 263.51624000000004, "r_x3": 70.030983, "r_y3": 263.51624000000004, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.57797, "r_y0": 271.45154, "r_x1": 266.47522, "r_y1": 271.45154, "r_x2": 266.47522, "r_y2": 263.43555000000003, "r_x3": 140.57797, "r_y3": 263.43555000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 54.594971, "t": 274.70758, "r": 286.36676, "b": 315.6004899999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9555517435073853, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594971, "r_y0": 282.72351, "r_x1": 64.848648, "r_y1": 282.72351, "r_x2": 64.848648, "r_y2": 274.70758, "r_x3": 54.594971, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.047119, "r_y0": 282.72351, "r_x1": 286.36676, "r_y1": 282.72351, "r_x2": 286.36676, "r_y2": 274.70758, "r_x3": 67.047119, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 293.68253, "r_x1": 179.57349, "r_y1": 293.68253, "r_x2": 179.57349, "r_y2": 285.66655999999995, "r_x3": 70.030975, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.01559, "r_y0": 293.68253, "r_x1": 194.4846, "r_y1": 293.68253, "r_x2": 194.4846, "r_y2": 285.66655999999995, "r_x3": 187.01559, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04398, "r_y0": 293.47632, "r_x1": 286.36304, "r_y1": 293.47632, "r_x2": 286.36304, "r_y2": 285.74725, "r_x3": 198.04398, "r_y3": 285.74725, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 304.43530000000004, "r_x1": 260.19937, "r_y1": 304.43530000000004, "r_x2": 260.19937, "r_y2": 296.70624, "r_x3": 70.030975, "r_y3": 296.70624, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.198, "r_y0": 304.64151, "r_x1": 286.36197, "r_y1": 304.64151, "r_x2": 286.36197, "r_y2": 296.62555, "r_x3": 260.198, "r_y3": 296.62555, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 315.6004899999999, "r_x1": 142.74849, "r_y1": 315.6004899999999, "r_x2": 142.74849, "r_y2": 307.5845299999999, "r_x3": 70.030991, "r_y3": 307.5845299999999, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 54.59499, "t": 318.85654, "r": 286.36319, "b": 348.78952, "coord_origin": "TOPLEFT" }, "confidence": 0.9479843378067017, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 326.8725, "r_x1": 65.61586, "r_y1": 326.8725, "r_x2": 65.61586, "r_y2": 318.85654, "r_x3": 54.59499, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.978821, "r_y0": 326.8725, "r_x1": 199.492, "r_y1": 326.8725, "r_x2": 199.492, "r_y2": 318.85654, "r_x3": 67.978821, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.98792, "r_y0": 326.8725, "r_x1": 286.35849, "r_y1": 326.8725, "r_x2": 286.35849, "r_y2": 318.85654, "r_x3": 206.98792, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 337.83051, "r_x1": 176.28284, "r_y1": 337.83051, "r_x2": 176.28284, "r_y2": 329.8145400000001, "r_x3": 70.030991, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.60416, "r_y0": 337.83051, "r_x1": 190.07317, "r_y1": 337.83051, "r_x2": 190.07317, "r_y2": 329.8145400000001, "r_x3": 182.60416, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28299, "r_y0": 337.62429999999995, "r_x1": 286.36319, "r_y1": 337.62429999999995, "r_x2": 286.36319, "r_y2": 329.89522999999997, "r_x3": 193.28299, "r_y3": 329.89522999999997, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 348.58331, "r_x1": 206.34717, "r_y1": 348.58331, "r_x2": 206.34717, "r_y2": 340.85425, "r_x3": 70.030991, "r_y3": 340.85425, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.34599, "r_y0": 348.78952, "r_x1": 274.82239, "r_y1": 348.78952, "r_x2": 274.82239, "r_y2": 340.77356, "r_x3": 206.34599, "r_y3": 340.77356, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 54.594986000000006, "t": 352.0455600000001, "r": 286.36331, "b": 403.89749, "coord_origin": "TOPLEFT" }, "confidence": 0.9484425187110901, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594986000000006, "r_y0": 360.06152, "r_x1": 65.04657, "r_y1": 360.06152, "r_x2": 65.04657, "r_y2": 352.0455600000001, "r_x3": 54.594986000000006, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.287483, "r_y0": 360.06152, "r_x1": 286.35849, "r_y1": 360.06152, "r_x2": 286.35849, "r_y2": 352.0455600000001, "r_x3": 67.287483, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 371.02054, "r_x1": 234.12507999999997, "r_y1": 371.02054, "r_x2": 234.12507999999997, "r_y2": 363.00458, "r_x3": 70.030983, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05186, "r_y0": 371.02054, "r_x1": 286.36331, "r_y1": 371.02054, "r_x2": 286.36331, "r_y2": 363.00458, "r_x3": 240.05186, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 381.97952, "r_x1": 286.36331, "r_y1": 381.97952, "r_x2": 286.36331, "r_y2": 373.96356, "r_x3": 70.030983, "r_y3": 373.96356, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 392.93851, "r_x1": 286.36331, "r_y1": 392.93851, "r_x2": 286.36331, "r_y2": 384.92255, "r_x3": 70.030983, "r_y3": 384.92255, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 403.89749, "r_x1": 114.57605, "r_y1": 403.89749, "r_x2": 114.57605, "r_y2": 395.88153, "r_x3": 70.030983, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.80399000000001, "r_y0": 403.69128, "r_x1": 186.7287, "r_y1": 403.69128, "r_x2": 186.7287, "r_y2": 395.96222, "r_x3": 117.80399000000001, "r_y3": 395.96222, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.728, "r_y0": 403.89749, "r_x1": 243.00113999999996, "r_y1": 403.89749, "r_x2": 243.00113999999996, "r_y2": 395.88153, "r_x3": 186.728, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 54.595001, "t": 407.15253000000007, "r": 286.35989, "b": 437.08646000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9330756664276123, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 415.1684900000001, "r_x1": 65.334427, "r_y1": 415.1684900000001, "r_x2": 65.334427, "r_y2": 407.15253000000007, "r_x3": 54.595001, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.637054, "r_y0": 415.1684900000001, "r_x1": 286.35852, "r_y1": 415.1684900000001, "r_x2": 286.35852, "r_y2": 407.15253000000007, "r_x3": 67.637054, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 426.12747, "r_x1": 147.13306, "r_y1": 426.12747, "r_x2": 147.13306, "r_y2": 418.11151, "r_x3": 70.030998, "r_y3": 418.11151, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15601, "r_y0": 425.92126, "r_x1": 286.35989, "r_y1": 425.92126, "r_x2": 286.35989, "r_y2": 418.1922, "r_x3": 149.15601, "r_y3": 418.1922, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.88025, "r_x1": 213.48445, "r_y1": 436.88025, "r_x2": 213.48445, "r_y2": 429.15118, "r_x3": 70.031006, "r_y3": 429.15118, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.483, "r_y0": 437.08646000000005, "r_x1": 261.04083, "r_y1": 437.08646000000005, "r_x2": 261.04083, "r_y2": 429.07050000000004, "r_x3": 213.483, "r_y3": 429.07050000000004, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "list_item", "bbox": { "l": 50.112, "t": 440.3424999999999, "r": 286.36334, "b": 481.23544, "coord_origin": "TOPLEFT" }, "confidence": 0.9274735450744629, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 448.3584599999999, "r_x1": 65.399307, "r_y1": 448.3584599999999, "r_x2": 65.399307, "r_y2": 440.3424999999999, "r_x3": 50.112, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693321, "r_y0": 448.3584599999999, "r_x1": 286.3587, "r_y1": 448.3584599999999, "r_x2": 286.3587, "r_y2": 440.3424999999999, "r_x3": 67.693321, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 459.31747, "r_x1": 202.74268, "r_y1": 459.31747, "r_x2": 202.74268, "r_y2": 451.30151, "r_x3": 70.030998, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.00122, "r_y0": 459.31747, "r_x1": 286.36331, "r_y1": 459.31747, "r_x2": 286.36331, "r_y2": 451.30151, "r_x3": 209.00122, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 470.27646, "r_x1": 286.36334, "r_y1": 470.27646, "r_x2": 286.36334, "r_y2": 462.2605, "r_x3": 70.030998, "r_y3": 462.2605, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 481.23544, "r_x1": 141.86981, "r_y1": 481.23544, "r_x2": 141.86981, "r_y2": 473.21948, "r_x3": 70.030998, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.097, "r_y0": 481.02924, "r_x1": 166.01561, "r_y1": 481.02924, "r_x2": 166.01561, "r_y2": 473.30017, "r_x3": 145.097, "r_y3": 473.30017, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.015, "r_y0": 481.23544, "r_x1": 259.90216, "r_y1": 481.23544, "r_x2": 259.90216, "r_y2": 473.21948, "r_x3": 166.015, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "list_item", "bbox": { "l": 50.112, "t": 484.49048, "r": 286.36331, "b": 536.34238, "coord_origin": "TOPLEFT" }, "confidence": 0.9299950003623962, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.50644, "r_x1": 66.033806, "r_y1": 492.50644, "r_x2": 66.033806, "r_y2": 484.49048, "r_x3": 50.112, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.423035, "r_y0": 492.50644, "r_x1": 286.35873, "r_y1": 492.50644, "r_x2": 286.35873, "r_y2": 484.49048, "r_x3": 68.423035, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 503.46542, "r_x1": 286.36331, "r_y1": 503.46542, "r_x2": 286.36331, "r_y2": 495.44946, "r_x3": 70.030998, "r_y3": 495.44946, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 514.2182, "r_x1": 227.40926, "r_y1": 514.2182, "r_x2": 227.40926, "r_y2": 506.48914, "r_x3": 70.030998, "r_y3": 506.48914, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.40500000000003, "r_y0": 514.4244100000001, "r_x1": 286.35913, "r_y1": 514.4244100000001, "r_x2": 286.35913, "r_y2": 506.40845, "r_x3": 227.40500000000003, "r_y3": 506.40845, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 525.38339, "r_x1": 286.36328, "r_y1": 525.38339, "r_x2": 286.36328, "r_y2": 517.36743, "r_x3": 70.031006, "r_y3": 517.36743, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 536.34238, "r_x1": 112.36138000000001, "r_y1": 536.34238, "r_x2": 112.36138000000001, "r_y2": 528.32642, "r_x3": 70.031006, "r_y3": 528.32642, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 50.112007, "t": 539.59842, "r": 286.36334, "b": 591.44937, "coord_origin": "TOPLEFT" }, "confidence": 0.9394103288650513, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 547.61438, "r_x1": 65.466705, "r_y1": 547.61438, "r_x2": 65.466705, "r_y2": 539.59842, "r_x3": 50.112007, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.770828, "r_y0": 547.61438, "r_x1": 286.35873, "r_y1": 547.61438, "r_x2": 286.35873, "r_y2": 539.59842, "r_x3": 67.770828, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 558.57338, "r_x1": 136.28374, "r_y1": 558.57338, "r_x2": 136.28374, "r_y2": 550.55742, "r_x3": 70.031006, "r_y3": 550.55742, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.811, "r_y0": 558.36716, "r_x1": 286.36206, "r_y1": 558.36716, "r_x2": 286.36206, "r_y2": 550.63812, "r_x3": 138.811, "r_y3": 550.63812, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 569.32616, "r_x1": 286.36334, "r_y1": 569.32616, "r_x2": 286.36334, "r_y2": 561.5971199999999, "r_x3": 70.031006, "r_y3": 561.5971199999999, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 580.28516, "r_x1": 74.514206, "r_y1": 580.28516, "r_x2": 74.514206, "r_y2": 572.55612, "r_x3": 70.031006, "r_y3": 572.55612, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.514008, "r_y0": 580.4913799999999, "r_x1": 286.36313, "r_y1": 580.4913799999999, "r_x2": 286.36313, "r_y2": 572.47542, "r_x3": 74.514008, "r_y3": 572.47542, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 591.44937, "r_x1": 90.357834, "r_y1": 591.44937, "r_x2": 90.357834, "r_y2": 583.4334100000001, "r_x3": 70.031006, "r_y3": 583.4334100000001, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 50.112007, "t": 594.70541, "r": 286.36331, "b": 646.55737, "coord_origin": "TOPLEFT" }, "confidence": 0.9298838973045349, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 602.72137, "r_x1": 66.270439, "r_y1": 602.72137, "r_x2": 66.270439, "r_y2": 594.70541, "r_x3": 50.112007, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.695168, "r_y0": 602.72137, "r_x1": 286.35873, "r_y1": 602.72137, "r_x2": 286.35873, "r_y2": 594.70541, "r_x3": 68.695168, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 613.68037, "r_x1": 286.3631, "r_y1": 613.68037, "r_x2": 286.3631, "r_y2": 605.66441, "r_x3": 70.031006, "r_y3": 605.66441, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 624.63937, "r_x1": 286.36331, "r_y1": 624.63937, "r_x2": 286.36331, "r_y2": 616.62341, "r_x3": 70.031006, "r_y3": 616.62341, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 635.5983699999999, "r_x1": 77.500015, "r_y1": 635.5983699999999, "r_x2": 77.500015, "r_y2": 627.58241, "r_x3": 70.031006, "r_y3": 627.58241, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.920006, "r_y0": 635.39215, "r_x1": 286.3624, "r_y1": 635.39215, "r_x2": 286.3624, "r_y2": 627.6631199999999, "r_x3": 79.920006, "r_y3": 627.6631199999999, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 646.35115, "r_x1": 140.67728, "r_y1": 646.35115, "r_x2": 140.67728, "r_y2": 638.62212, "r_x3": 70.031006, "r_y3": 638.62212, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.67599, "r_y0": 646.55737, "r_x1": 264.43921, "r_y1": 646.55737, "r_x2": 264.43921, "r_y2": 638.54141, "r_x3": 140.67599, "r_y3": 638.54141, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "list_item", "bbox": { "l": 50.111992, "t": 649.81342, "r": 286.36334, "b": 679.74638, "coord_origin": "TOPLEFT" }, "confidence": 0.9115257263183594, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 657.82938, "r_x1": 66.534035, "r_y1": 657.82938, "r_x2": 66.534035, "r_y2": 649.81342, "r_x3": 50.111992, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.998329, "r_y0": 657.82938, "r_x1": 286.35873, "r_y1": 657.82938, "r_x2": 286.35873, "r_y2": 649.81342, "r_x3": 68.998329, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 668.78738, "r_x1": 93.200165, "r_y1": 668.78738, "r_x2": 93.200165, "r_y2": 660.77142, "r_x3": 70.030991, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.20243, "r_y0": 668.78738, "r_x1": 286.36334, "r_y1": 668.78738, "r_x2": 286.36334, "r_y2": 660.77142, "r_x3": 102.20243, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 679.74638, "r_x1": 171.9969, "r_y1": 679.74638, "r_x2": 171.9969, "r_y2": 671.73042, "r_x3": 70.030991, "r_y3": 671.73042, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "list_item", "bbox": { "l": 50.111992, "t": 683.00243, "r": 286.35931, "b": 712.936386, "coord_origin": "TOPLEFT" }, "confidence": 0.912230372428894, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 691.01839, "r_x1": 65.515968, "r_y1": 691.01839, "r_x2": 65.515968, "r_y2": 683.00243, "r_x3": 50.111992, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.827499, "r_y0": 691.01839, "r_x1": 286.3587, "r_y1": 691.01839, "r_x2": 286.3587, "r_y2": 683.00243, "r_x3": 67.827499, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 701.977386, "r_x1": 102.15761, "r_y1": 701.977386, "r_x2": 102.15761, "r_y2": 693.9614260000001, "r_x3": 70.030991, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.54999, "r_y0": 701.771156, "r_x1": 231.47461, "r_y1": 701.771156, "r_x2": 231.47461, "r_y2": 694.0421220000001, "r_x3": 107.54999, "r_y3": 694.0421220000001, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.47598, "r_y0": 701.977386, "r_x1": 286.35931, "r_y1": 701.977386, "r_x2": 286.35931, "r_y2": 693.9614260000001, "r_x3": 231.47598, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 712.936386, "r_x1": 97.916481, "r_y1": 712.936386, "r_x2": 97.916481, "r_y2": 704.920425, "r_x3": 70.030975, "r_y3": 704.920425, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 308.86197, "t": 75.88342000000011, "r": 545.11475, "b": 138.69335999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9389600157737732, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 83.89940999999999, "r_x1": 324.74973, "r_y1": 83.89940999999999, "r_x2": 324.74973, "r_y2": 75.88342000000011, "r_x3": 308.86197, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13382, "r_y0": 83.89940999999999, "r_x1": 545.1087, "r_y1": 83.89940999999999, "r_x2": 545.1087, "r_y2": 75.88342000000011, "r_x3": 327.13382, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 94.85741999999993, "r_x1": 545.1134, "r_y1": 94.85741999999993, "r_x2": 545.1134, "r_y2": 86.84142999999995, "r_x3": 328.78098, "r_y3": 86.84142999999995, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 105.81641000000002, "r_x1": 390.96295, "r_y1": 105.81641000000002, "r_x2": 390.96295, "r_y2": 97.80042000000003, "r_x3": 328.78098, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27008, "r_y0": 105.81641000000002, "r_x1": 435.1404099999999, "r_y1": 105.81641000000002, "r_x2": 435.1404099999999, "r_y2": 97.80042000000003, "r_x3": 400.27008, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71277, "r_y0": 105.81641000000002, "r_x1": 545.11328, "r_y1": 105.81641000000002, "r_x2": 545.11328, "r_y2": 97.80042000000003, "r_x3": 441.71277, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 116.7753899999999, "r_x1": 440.80719, "r_y1": 116.7753899999999, "r_x2": 440.80719, "r_y2": 108.75940000000003, "r_x3": 328.78098, "r_y3": 108.75940000000003, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63498, "r_y0": 116.56914999999992, "r_x1": 545.11304, "r_y1": 116.56914999999992, "r_x2": 545.11304, "r_y2": 108.84009000000003, "r_x3": 446.63498, "r_y3": 108.84009000000003, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 127.52814000000001, "r_x1": 471.13153, "r_y1": 127.52814000000001, "r_x2": 471.13153, "r_y2": 119.79907000000003, "r_x3": 328.78098, "r_y3": 119.79907000000003, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13300000000004, "r_y0": 127.73437999999999, "r_x1": 545.11475, "r_y1": 127.73437999999999, "r_x2": 545.11475, "r_y2": 119.71838000000002, "r_x3": 471.13300000000004, "r_y3": 119.71838000000002, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 138.69335999999998, "r_x1": 356.6665, "r_y1": 138.69335999999998, "r_x2": 356.6665, "r_y2": 130.67737, "r_x3": 328.78101, "r_y3": 130.67737, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "list_item", "bbox": { "l": 308.862, "t": 142.12334999999996, "r": 545.1134, "b": 172.05633999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9253129959106445, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 150.13933999999995, "r_x1": 325.24371, "r_y1": 150.13933999999995, "r_x2": 325.24371, "r_y2": 142.12334999999996, "r_x3": 308.862, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.70197, "r_y0": 150.13933999999995, "r_x1": 545.10883, "r_y1": 150.13933999999995, "r_x2": 545.10883, "r_y2": 142.12334999999996, "r_x3": 327.70197, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.09735, "r_x1": 414.44598, "r_y1": 161.09735, "r_x2": 414.44598, "r_y2": 153.08136000000002, "r_x3": 328.78101, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.82532, "r_y0": 161.09735, "r_x1": 545.1134, "r_y1": 161.09735, "r_x2": 545.1134, "r_y2": 153.08136000000002, "r_x3": 421.82532, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 172.05633999999998, "r_x1": 493.62835999999993, "r_y1": 172.05633999999998, "r_x2": 493.62835999999993, "r_y2": 164.04034000000001, "r_x3": 328.78101, "r_y3": 164.04034000000001, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 308.862, "t": 175.48632999999995, "r": 545.11353, "b": 260.21423000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9299732446670532, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.50232000000005, "r_x1": 324.26599, "r_y1": 183.50232000000005, "r_x2": 324.26599, "r_y2": 175.48632999999995, "r_x3": 308.862, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57751, "r_y0": 183.50232000000005, "r_x1": 545.10876, "r_y1": 183.50232000000005, "r_x2": 545.10876, "r_y2": 175.48632999999995, "r_x3": 326.57751, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 194.46130000000005, "r_x1": 545.11334, "r_y1": 194.46130000000005, "r_x2": 545.11334, "r_y2": 186.44530999999995, "r_x3": 328.78101, "r_y3": 186.44530999999995, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 205.42029000000002, "r_x1": 545.11346, "r_y1": 205.42029000000002, "r_x2": 545.11346, "r_y2": 197.40430000000003, "r_x3": 328.78101, "r_y3": 197.40430000000003, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 216.37927000000002, "r_x1": 545.11353, "r_y1": 216.37927000000002, "r_x2": 545.11353, "r_y2": 208.36328000000003, "r_x3": 328.78101, "r_y3": 208.36328000000003, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 227.33826, "r_x1": 479.26413, "r_y1": 227.33826, "r_x2": 479.26413, "r_y2": 219.32227, "r_x3": 328.78101, "r_y3": 219.32227, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 227.13202, "r_x1": 545.11273, "r_y1": 227.13202, "r_x2": 545.11273, "r_y2": 219.40295000000003, "r_x3": 483.11902, "r_y3": 219.40295000000003, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 238.09002999999996, "r_x1": 519.39771, "r_y1": 238.09002999999996, "r_x2": 519.39771, "r_y2": 230.36095999999998, "r_x3": 328.78101, "r_y3": 230.36095999999998, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.401, "r_y0": 238.29625999999996, "r_x1": 545.10767, "r_y1": 238.29625999999996, "r_x2": 545.10767, "r_y2": 230.28026999999997, "r_x3": 519.401, "r_y3": 230.28026999999997, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 249.25525000000005, "r_x1": 545.11328, "r_y1": 249.25525000000005, "r_x2": 545.11328, "r_y2": 241.23925999999994, "r_x3": 328.78101, "r_y3": 241.23925999999994, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 260.21423000000004, "r_x1": 333.26422, "r_y1": 260.21423000000004, "r_x2": 333.26422, "r_y2": 252.19824000000006, "r_x3": 328.78101, "r_y3": 252.19824000000006, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 308.862, "t": 263.64423, "r": 545.1142, "b": 326.45413, "coord_origin": "TOPLEFT" }, "confidence": 0.937321662902832, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 271.66022, "r_x1": 324.26477, "r_y1": 271.66022, "r_x2": 324.26477, "r_y2": 263.64423, "r_x3": 308.862, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57611, "r_y0": 271.66022, "r_x1": 545.10883, "r_y1": 271.66022, "r_x2": 545.10883, "r_y2": 263.64423, "r_x3": 326.57611, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 282.61917000000005, "r_x1": 545.1134, "r_y1": 282.61917000000005, "r_x2": 545.1134, "r_y2": 274.60321, "r_x3": 328.78101, "r_y3": 274.60321, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 293.57816, "r_x1": 545.11328, "r_y1": 293.57816, "r_x2": 545.11328, "r_y2": 285.56219, "r_x3": 328.78101, "r_y3": 285.56219, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 304.53714, "r_x1": 545.11334, "r_y1": 304.53714, "r_x2": 545.11334, "r_y2": 296.52118, "r_x3": 328.78101, "r_y3": 296.52118, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 315.49515, "r_x1": 352.84683, "r_y1": 315.49515, "r_x2": 352.84683, "r_y2": 307.47919, "r_x3": 328.78101, "r_y3": 307.47919, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.23599, "r_y0": 315.28894, "r_x1": 545.1142, "r_y1": 315.28894, "r_x2": 545.1142, "r_y2": 307.55988, "r_x3": 360.23599, "r_y3": 307.55988, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 326.24792, "r_x1": 371.02173, "r_y1": 326.24792, "r_x2": 371.02173, "r_y2": 318.51886, "r_x3": 328.78101, "r_y3": 318.51886, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.021, "r_y0": 326.45413, "r_x1": 502.26227, "r_y1": 326.45413, "r_x2": 502.26227, "r_y2": 318.43817, "r_x3": 371.021, "r_y3": 318.43817, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 308.862, "t": 329.88419, "r": 545.11609, "b": 370.77713, "coord_origin": "TOPLEFT" }, "confidence": 0.9027292728424072, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.90015, "r_x1": 323.82672, "r_y1": 337.90015, "r_x2": 323.82672, "r_y2": 329.88419, "r_x3": 308.862, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07233, "r_y0": 337.90015, "r_x1": 545.10876, "r_y1": 337.90015, "r_x2": 545.10876, "r_y2": 329.88419, "r_x3": 326.07233, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 348.85916, "r_x1": 545.11346, "r_y1": 348.85916, "r_x2": 545.11346, "r_y2": 340.8432, "r_x3": 328.78101, "r_y3": 340.8432, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 359.81815000000006, "r_x1": 382.7767, "r_y1": 359.81815000000006, "r_x2": 382.7767, "r_y2": 351.80219000000005, "r_x3": 328.78101, "r_y3": 351.80219000000005, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54102, "r_y0": 359.61194, "r_x1": 545.11609, "r_y1": 359.61194, "r_x2": 545.11609, "r_y2": 351.88287, "r_x3": 385.54102, "r_y3": 351.88287, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 370.57092, "r_x1": 443.59579, "r_y1": 370.57092, "r_x2": 443.59579, "r_y2": 362.84186, "r_x3": 328.78101, "r_y3": 362.84186, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59399, "r_y0": 370.77713, "r_x1": 534.48645, "r_y1": 370.77713, "r_x2": 534.48645, "r_y2": 362.76117, "r_x3": 443.59399, "r_y3": 362.76117, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "list_item", "bbox": { "l": 308.862, "t": 374.20618, "r": 545.11346, "b": 437.01706, "coord_origin": "TOPLEFT" }, "confidence": 0.882714569568634, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 382.22214, "r_x1": 324.60281, "r_y1": 382.22214, "r_x2": 324.60281, "r_y2": 374.20618, "r_x3": 308.862, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96487, "r_y0": 382.22214, "r_x1": 362.6604, "r_y1": 382.22214, "r_x2": 362.6604, "r_y2": 374.20618, "r_x3": 326.96487, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69479, "r_y0": 382.22214, "r_x1": 389.6134, "r_y1": 382.22214, "r_x2": 389.6134, "r_y2": 374.20618, "r_x3": 368.69479, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.6478, "r_y0": 382.22214, "r_x1": 424.56445, "r_y1": 382.22214, "r_x2": 424.56445, "r_y2": 374.20618, "r_x3": 395.6478, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.5492899999999, "r_y0": 382.22214, "r_x1": 438.0230399999999, "r_y1": 382.22214, "r_x2": 438.0230399999999, "r_y2": 374.20618, "r_x3": 431.5492899999999, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.05743, "r_y0": 382.22214, "r_x1": 488.5038799999999, "r_y1": 382.22214, "r_x2": 488.5038799999999, "r_y2": 374.20618, "r_x3": 444.05743, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.47974, "r_y0": 382.22214, "r_x1": 515.41205, "r_y1": 382.22214, "r_x2": 515.41205, "r_y2": 374.20618, "r_x3": 495.47974, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.44641, "r_y0": 382.22214, "r_x1": 545.10876, "r_y1": 382.22214, "r_x2": 545.10876, "r_y2": 374.20618, "r_x3": 521.44641, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 393.18112, "r_x1": 545.1134, "r_y1": 393.18112, "r_x2": 545.1134, "r_y2": 385.16516, "r_x3": 328.78101, "r_y3": 385.16516, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 404.14011, "r_x1": 545.11346, "r_y1": 404.14011, "r_x2": 545.11346, "r_y2": 396.12415, "r_x3": 328.78101, "r_y3": 396.12415, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 415.09909, "r_x1": 478.00881999999996, "r_y1": 415.09909, "r_x2": 478.00881999999996, "r_y2": 407.08313, "r_x3": 328.78101, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.0701, "r_y0": 415.09909, "r_x1": 491.53912, "r_y1": 415.09909, "r_x2": 491.53912, "r_y2": 407.08313, "r_x3": 484.0701, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.668, "r_y0": 414.89288, "r_x1": 545.11298, "r_y1": 414.89288, "r_x2": 545.11298, "r_y2": 407.16382, "r_x3": 494.668, "r_y3": 407.16382, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 425.85187, "r_x1": 545.11334, "r_y1": 425.85187, "r_x2": 545.11334, "r_y2": 418.12280000000004, "r_x3": 328.78101, "r_y3": 418.12280000000004, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 436.8108500000001, "r_x1": 360.83591, "r_y1": 436.8108500000001, "r_x2": 360.83591, "r_y2": 429.08179, "r_x3": 328.78101, "r_y3": 429.08179, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.836, "r_y0": 437.01706, "r_x1": 475.63287, "r_y1": 437.01706, "r_x2": 475.63287, "r_y2": 429.0011, "r_x3": 360.836, "r_y3": 429.0011, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "list_item", "bbox": { "l": 308.862, "t": 440.44611, "r": 545.11475, "b": 558.05096, "coord_origin": "TOPLEFT" }, "confidence": 0.8896440863609314, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.46207, "r_x1": 324.57407, "r_y1": 448.46207, "r_x2": 324.57407, "r_y2": 440.44611, "r_x3": 308.862, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93179, "r_y0": 448.46207, "r_x1": 545.1087, "r_y1": 448.46207, "r_x2": 545.1087, "r_y2": 440.44611, "r_x3": 326.93179, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 459.42105, "r_x1": 545.11346, "r_y1": 459.42105, "r_x2": 545.11346, "r_y2": 451.40509, "r_x3": 328.78101, "r_y3": 451.40509, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 470.38004, "r_x1": 545.11328, "r_y1": 470.38004, "r_x2": 545.11328, "r_y2": 462.36407, "r_x3": 328.78101, "r_y3": 462.36407, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 481.33902, "r_x1": 545.11328, "r_y1": 481.33902, "r_x2": 545.11328, "r_y2": 473.32306, "r_x3": 328.78101, "r_y3": 473.32306, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 492.298, "r_x1": 545.11328, "r_y1": 492.298, "r_x2": 545.11328, "r_y2": 484.28204, "r_x3": 328.78101, "r_y3": 484.28204, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 503.25699, "r_x1": 545.1134, "r_y1": 503.25699, "r_x2": 545.1134, "r_y2": 495.24103, "r_x3": 328.78101, "r_y3": 495.24103, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 514.21597, "r_x1": 545.1134, "r_y1": 514.21597, "r_x2": 545.1134, "r_y2": 506.20001, "r_x3": 328.78101, "r_y3": 506.20001, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 525.17496, "r_x1": 545.1098, "r_y1": 525.17496, "r_x2": 545.1098, "r_y2": 517.159, "r_x3": 328.78101, "r_y3": 517.159, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 536.13297, "r_x1": 434.56659, "r_y1": 536.13297, "r_x2": 434.56659, "r_y2": 528.117, "r_x3": 328.78101, "r_y3": 528.117, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86401, "r_y0": 535.9267600000001, "r_x1": 545.11115, "r_y1": 535.9267600000001, "r_x2": 545.11115, "r_y2": 528.19769, "r_x3": 437.86401, "r_y3": 528.19769, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 546.8857399999999, "r_x1": 425.73471, "r_y1": 546.8857399999999, "r_x2": 425.73471, "r_y2": 539.15671, "r_x3": 328.78101, "r_y3": 539.15671, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.73602, "r_y0": 547.09196, "r_x1": 545.11475, "r_y1": 547.09196, "r_x2": 545.11475, "r_y2": 539.076, "r_x3": 425.73602, "r_y3": 539.076, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 558.05096, "r_x1": 399.74109, "r_y1": 558.05096, "r_x2": 399.74109, "r_y2": 550.035, "r_x3": 328.78101, "r_y3": 550.035, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "list_item", "bbox": { "l": 308.862, "t": 561.481, "r": 545.1134, "b": 624.29097, "coord_origin": "TOPLEFT" }, "confidence": 0.9025435447692871, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.49696, "r_x1": 324.50351, "r_y1": 569.49696, "r_x2": 324.50351, "r_y2": 561.481, "r_x3": 308.862, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85068, "r_y0": 569.49696, "r_x1": 545.10876, "r_y1": 569.49696, "r_x2": 545.10876, "r_y2": 561.481, "r_x3": 326.85068, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 580.45596, "r_x1": 545.1134, "r_y1": 580.45596, "r_x2": 545.1134, "r_y2": 572.44, "r_x3": 328.78101, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 591.4149600000001, "r_x1": 545.11334, "r_y1": 591.4149600000001, "r_x2": 545.11334, "r_y2": 583.399, "r_x3": 328.78101, "r_y3": 583.399, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 602.37396, "r_x1": 431.61667, "r_y1": 602.37396, "r_x2": 431.61667, "r_y2": 594.358, "r_x3": 328.78101, "r_y3": 594.358, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69101000000006, "r_y0": 602.16774, "r_x1": 545.11224, "r_y1": 602.16774, "r_x2": 545.11224, "r_y2": 594.4387099999999, "r_x3": 434.69101000000006, "r_y3": 594.4387099999999, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 613.12575, "r_x1": 545.1134, "r_y1": 613.12575, "r_x2": 545.1134, "r_y2": 605.39671, "r_x3": 328.78101, "r_y3": 605.39671, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 624.08475, "r_x1": 367.8028, "r_y1": 624.08475, "r_x2": 367.8028, "r_y2": 616.35571, "r_x3": 328.78101, "r_y3": 616.35571, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.802, "r_y0": 624.29097, "r_x1": 458.69446000000005, "r_y1": 624.29097, "r_x2": 458.69446000000005, "r_y2": 616.2750100000001, "r_x3": 367.802, "r_y3": 616.2750100000001, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "list_item", "bbox": { "l": 308.862, "t": 627.72101, "r": 545.11621, "b": 668.61398, "coord_origin": "TOPLEFT" }, "confidence": 0.8777532577514648, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 635.73697, "r_x1": 324.69476, "r_y1": 635.73697, "r_x2": 324.69476, "r_y2": 627.72101, "r_x3": 308.862, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07065, "r_y0": 635.73697, "r_x1": 545.1087, "r_y1": 635.73697, "r_x2": 545.1087, "r_y2": 627.72101, "r_x3": 327.07065, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 646.69597, "r_x1": 545.11328, "r_y1": 646.69597, "r_x2": 545.11328, "r_y2": 638.68001, "r_x3": 328.78101, "r_y3": 638.68001, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 657.65497, "r_x1": 336.25003, "r_y1": 657.65497, "r_x2": 336.25003, "r_y2": 649.63901, "r_x3": 328.78101, "r_y3": 649.63901, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.10001, "r_y0": 657.44875, "r_x1": 545.11621, "r_y1": 657.44875, "r_x2": 545.11621, "r_y2": 649.71971, "r_x3": 338.10001, "r_y3": 649.71971, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 668.40775, "r_x1": 406.32245, "r_y1": 668.40775, "r_x2": 406.32245, "r_y2": 660.67871, "r_x3": 328.78101, "r_y3": 660.67871, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 668.61398, "r_x1": 521.1189, "r_y1": 668.61398, "r_x2": 521.1189, "r_y2": 660.5980099999999, "r_x3": 406.32202, "r_y3": 660.5980099999999, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "list_item", "bbox": { "l": 308.86203, "t": 672.04301, "r": 545.1134, "b": 712.935974, "coord_origin": "TOPLEFT" }, "confidence": 0.8654531240463257, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 680.05898, "r_x1": 324.71329, "r_y1": 680.05898, "r_x2": 324.71329, "r_y2": 672.04301, "r_x3": 308.86203, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09195, "r_y0": 680.05898, "r_x1": 545.10876, "r_y1": 680.05898, "r_x2": 545.10876, "r_y2": 672.04301, "r_x3": 327.09195, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 691.01797, "r_x1": 482.81488, "r_y1": 691.01797, "r_x2": 482.81488, "r_y2": 683.0020099999999, "r_x3": 328.78104, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75064, "r_y0": 691.01797, "r_x1": 545.1134, "r_y1": 691.01797, "r_x2": 545.1134, "r_y2": 683.0020099999999, "r_x3": 488.75064, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 701.976974, "r_x1": 545.11334, "r_y1": 701.976974, "r_x2": 545.11334, "r_y2": 693.961014, "r_x3": 328.78104, "r_y3": 693.961014, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 712.935974, "r_x1": 379.1543, "r_y1": 712.935974, "r_x2": 379.1543, "r_y2": 704.920013, "r_x3": 328.78104, "r_y3": 704.920013, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.61603, "r_y0": 712.729744, "r_x1": 545.10938, "r_y1": 712.729744, "r_x2": 545.10938, "r_y2": 705.00071, "r_x3": 381.61603, "r_y3": 705.00071, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "page_footer", "bbox": { "l": 295.12103, "t": 734.1325870000001, "r": 300.10233, "b": 743.0391500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.8797808885574341, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.0391500000001, "r_x1": 300.10233, "r_y1": 743.0391500000001, "r_x2": 300.10233, "r_y2": 734.1325870000001, "r_x3": 295.12103, "r_y3": 734.1325870000001, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "list_item", "id": 25, "page_no": 8, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 70.030998, "t": 75.88378999999998, "r": 286.36334, "b": 116.77575999999999, "coord_origin": "TOPLEFT" }, "confidence": 0.7310384511947632, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.89977999999996, "r_x1": 286.36334, "r_y1": 83.89977999999996, "r_x2": 286.36334, "r_y2": 75.88378999999998, "r_x3": 70.030998, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 94.85875999999996, "r_x1": 286.36331, "r_y1": 94.85875999999996, "r_x2": 286.36331, "r_y2": 86.84276999999997, "r_x3": 70.030998, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 105.81677000000002, "r_x1": 85.722198, "r_y1": 105.81677000000002, "r_x2": 85.722198, "r_y2": 97.80078000000003, "r_x3": 70.030998, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.889, "r_y0": 105.61053000000004, "r_x1": 199.93315, "r_y1": 105.61053000000004, "r_x2": 199.93315, "r_y2": 97.88147000000004, "r_x3": 87.889, "r_y3": 97.88147000000004, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.936, "r_y0": 105.81677000000002, "r_x1": 286.36313, "r_y1": 105.81677000000002, "r_x2": 286.36313, "r_y2": 97.80078000000003, "r_x3": 199.936, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 116.77575999999999, "r_x1": 221.94871999999998, "r_y1": 116.77575999999999, "r_x2": 221.94871999999998, "r_y2": 108.75977, "r_x3": 70.031006, "r_y3": 108.75977, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5" }, { "label": "list_item", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 54.595005, "t": 120.03174000000013, "r": 286.36334, "b": 149.96569999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9372755885124207, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595005, "r_y0": 128.04773, "r_x1": 65.206657, "r_y1": 128.04773, "r_x2": 65.206657, "r_y2": 120.03174000000013, "r_x3": 54.595005, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.481873, "r_y0": 128.04773, "r_x1": 286.35852, "r_y1": 128.04773, "r_x2": 286.35852, "r_y2": 120.03174000000013, "r_x3": 67.481873, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.00671, "r_x1": 179.67215, "r_y1": 139.00671, "r_x2": 179.67215, "r_y2": 130.99072, "r_x3": 70.031006, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58101, "r_y0": 139.00671, "r_x1": 286.36334, "r_y1": 139.00671, "r_x2": 286.36334, "r_y2": 130.99072, "r_x3": 185.58101, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.96569999999997, "r_x1": 113.11456, "r_y1": 149.96569999999997, "r_x2": 113.11456, "r_y2": 141.94970999999998, "r_x3": 70.031006, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34200999999999, "r_y0": 149.75946, "r_x1": 235.3082, "r_y1": 149.75946, "r_x2": 235.3082, "r_y2": 142.0304, "r_x3": 116.34200999999999, "r_y3": 142.0304, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.30701, "r_y0": 149.96569999999997, "r_x1": 267.67572, "r_y1": 149.96569999999997, "r_x2": 267.67572, "r_y2": 141.94970999999998, "r_x3": 235.30701, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3" }, { "label": "list_item", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 54.595001, "t": 153.22168, "r": 286.36301, "b": 183.15466000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9378374218940735, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 161.23766999999998, "r_x1": 65.103195, "r_y1": 161.23766999999998, "r_x2": 65.103195, "r_y2": 153.22168, "r_x3": 54.595001, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.356239, "r_y0": 161.23766999999998, "r_x1": 218.77876, "r_y1": 161.23766999999998, "r_x2": 218.77876, "r_y2": 153.22168, "r_x3": 67.356239, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.97999999999996, "r_y0": 161.03143, "r_x1": 286.36301, "r_y1": 161.03143, "r_x2": 286.36301, "r_y2": 153.30237, "r_x3": 220.97999999999996, "r_y3": 153.30237, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 171.99041999999997, "r_x1": 125.26401000000001, "r_y1": 171.99041999999997, "r_x2": 125.26401000000001, "r_y2": 164.26135, "r_x3": 70.030991, "r_y3": 164.26135, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26098999999999, "r_y0": 172.19665999999995, "r_x1": 286.36029, "r_y1": 172.19665999999995, "r_x2": 286.36029, "r_y2": 164.18066, "r_x3": 125.26098999999999, "r_y3": 164.18066, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 183.15466000000004, "r_x1": 97.916496, "r_y1": 183.15466000000004, "r_x2": 97.916496, "r_y2": 175.13867000000005, "r_x3": 70.030991, "r_y3": 175.13867000000005, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2" }, { "label": "list_item", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 54.59499, "t": 186.41063999999994, "r": 286.36401, "b": 227.30358999999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9648825526237488, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 194.42664000000002, "r_x1": 65.806984, "r_y1": 194.42664000000002, "r_x2": 65.806984, "r_y2": 186.41063999999994, "r_x3": 54.59499, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.210922, "r_y0": 194.42664000000002, "r_x1": 286.36401, "r_y1": 194.42664000000002, "r_x2": 286.36401, "r_y2": 186.41063999999994, "r_x3": 68.210922, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 205.38562000000002, "r_x1": 286.36331, "r_y1": 205.38562000000002, "r_x2": 286.36331, "r_y2": 197.36963000000003, "r_x3": 70.030983, "r_y3": 197.36963000000003, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 216.3446, "r_x1": 286.36334, "r_y1": 216.3446, "r_x2": 286.36334, "r_y2": 208.32861000000003, "r_x3": 70.030983, "r_y3": 208.32861000000003, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 227.30358999999999, "r_x1": 245.83519, "r_y1": 227.30358999999999, "r_x2": 245.83519, "r_y2": 219.2876, "r_x3": 70.030983, "r_y3": 219.2876, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2" }, { "label": "list_item", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 54.594982, "t": 230.55957, "r": 286.36334, "b": 271.45154, "coord_origin": "TOPLEFT" }, "confidence": 0.9620943069458008, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594982, "r_y0": 238.57556, "r_x1": 65.381134, "r_y1": 238.57556, "r_x2": 65.381134, "r_y2": 230.55957, "r_x3": 54.594982, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693779, "r_y0": 238.57556, "r_x1": 286.35849, "r_y1": 238.57556, "r_x2": 286.35849, "r_y2": 230.55957, "r_x3": 67.693779, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 249.53454999999997, "r_x1": 286.36334, "r_y1": 249.53454999999997, "r_x2": 286.36334, "r_y2": 241.51855, "r_x3": 70.030983, "r_y3": 241.51855, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 260.49255000000005, "r_x1": 108.39821, "r_y1": 260.49255000000005, "r_x2": 108.39821, "r_y2": 252.47655999999995, "r_x3": 70.030983, "r_y3": 252.47655999999995, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64498000000002, "r_y0": 260.28632000000005, "r_x1": 286.3595, "r_y1": 260.28632000000005, "r_x2": 286.3595, "r_y2": 252.55724999999995, "r_x3": 110.64498000000002, "r_y3": 252.55724999999995, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 271.24530000000004, "r_x1": 140.57861, "r_y1": 271.24530000000004, "r_x2": 140.57861, "r_y2": 263.51624000000004, "r_x3": 70.030983, "r_y3": 263.51624000000004, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.57797, "r_y0": 271.45154, "r_x1": 266.47522, "r_y1": 271.45154, "r_x2": 266.47522, "r_y2": 263.43555000000003, "r_x3": 140.57797, "r_y3": 263.43555000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2" }, { "label": "list_item", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 54.594971, "t": 274.70758, "r": 286.36676, "b": 315.6004899999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9555517435073853, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594971, "r_y0": 282.72351, "r_x1": 64.848648, "r_y1": 282.72351, "r_x2": 64.848648, "r_y2": 274.70758, "r_x3": 54.594971, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.047119, "r_y0": 282.72351, "r_x1": 286.36676, "r_y1": 282.72351, "r_x2": 286.36676, "r_y2": 274.70758, "r_x3": 67.047119, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 293.68253, "r_x1": 179.57349, "r_y1": 293.68253, "r_x2": 179.57349, "r_y2": 285.66655999999995, "r_x3": 70.030975, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.01559, "r_y0": 293.68253, "r_x1": 194.4846, "r_y1": 293.68253, "r_x2": 194.4846, "r_y2": 285.66655999999995, "r_x3": 187.01559, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04398, "r_y0": 293.47632, "r_x1": 286.36304, "r_y1": 293.47632, "r_x2": 286.36304, "r_y2": 285.74725, "r_x3": 198.04398, "r_y3": 285.74725, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 304.43530000000004, "r_x1": 260.19937, "r_y1": 304.43530000000004, "r_x2": 260.19937, "r_y2": 296.70624, "r_x3": 70.030975, "r_y3": 296.70624, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.198, "r_y0": 304.64151, "r_x1": 286.36197, "r_y1": 304.64151, "r_x2": 286.36197, "r_y2": 296.62555, "r_x3": 260.198, "r_y3": 296.62555, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 315.6004899999999, "r_x1": 142.74849, "r_y1": 315.6004899999999, "r_x2": 142.74849, "r_y2": 307.5845299999999, "r_x3": 70.030991, "r_y3": 307.5845299999999, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2" }, { "label": "list_item", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 54.59499, "t": 318.85654, "r": 286.36319, "b": 348.78952, "coord_origin": "TOPLEFT" }, "confidence": 0.9479843378067017, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 326.8725, "r_x1": 65.61586, "r_y1": 326.8725, "r_x2": 65.61586, "r_y2": 318.85654, "r_x3": 54.59499, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.978821, "r_y0": 326.8725, "r_x1": 199.492, "r_y1": 326.8725, "r_x2": 199.492, "r_y2": 318.85654, "r_x3": 67.978821, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.98792, "r_y0": 326.8725, "r_x1": 286.35849, "r_y1": 326.8725, "r_x2": 286.35849, "r_y2": 318.85654, "r_x3": 206.98792, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 337.83051, "r_x1": 176.28284, "r_y1": 337.83051, "r_x2": 176.28284, "r_y2": 329.8145400000001, "r_x3": 70.030991, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.60416, "r_y0": 337.83051, "r_x1": 190.07317, "r_y1": 337.83051, "r_x2": 190.07317, "r_y2": 329.8145400000001, "r_x3": 182.60416, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28299, "r_y0": 337.62429999999995, "r_x1": 286.36319, "r_y1": 337.62429999999995, "r_x2": 286.36319, "r_y2": 329.89522999999997, "r_x3": 193.28299, "r_y3": 329.89522999999997, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 348.58331, "r_x1": 206.34717, "r_y1": 348.58331, "r_x2": 206.34717, "r_y2": 340.85425, "r_x3": 70.030991, "r_y3": 340.85425, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.34599, "r_y0": 348.78952, "r_x1": 274.82239, "r_y1": 348.78952, "r_x2": 274.82239, "r_y2": 340.77356, "r_x3": 206.34599, "r_y3": 340.77356, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2" }, { "label": "list_item", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 54.594986000000006, "t": 352.0455600000001, "r": 286.36331, "b": 403.89749, "coord_origin": "TOPLEFT" }, "confidence": 0.9484425187110901, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594986000000006, "r_y0": 360.06152, "r_x1": 65.04657, "r_y1": 360.06152, "r_x2": 65.04657, "r_y2": 352.0455600000001, "r_x3": 54.594986000000006, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.287483, "r_y0": 360.06152, "r_x1": 286.35849, "r_y1": 360.06152, "r_x2": 286.35849, "r_y2": 352.0455600000001, "r_x3": 67.287483, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 371.02054, "r_x1": 234.12507999999997, "r_y1": 371.02054, "r_x2": 234.12507999999997, "r_y2": 363.00458, "r_x3": 70.030983, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05186, "r_y0": 371.02054, "r_x1": 286.36331, "r_y1": 371.02054, "r_x2": 286.36331, "r_y2": 363.00458, "r_x3": 240.05186, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 381.97952, "r_x1": 286.36331, "r_y1": 381.97952, "r_x2": 286.36331, "r_y2": 373.96356, "r_x3": 70.030983, "r_y3": 373.96356, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 392.93851, "r_x1": 286.36331, "r_y1": 392.93851, "r_x2": 286.36331, "r_y2": 384.92255, "r_x3": 70.030983, "r_y3": 384.92255, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 403.89749, "r_x1": 114.57605, "r_y1": 403.89749, "r_x2": 114.57605, "r_y2": 395.88153, "r_x3": 70.030983, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.80399000000001, "r_y0": 403.69128, "r_x1": 186.7287, "r_y1": 403.69128, "r_x2": 186.7287, "r_y2": 395.96222, "r_x3": 117.80399000000001, "r_y3": 395.96222, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.728, "r_y0": 403.89749, "r_x1": 243.00113999999996, "r_y1": 403.89749, "r_x2": 243.00113999999996, "r_y2": 395.88153, "r_x3": 186.728, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1" }, { "label": "list_item", "id": 10, "page_no": 8, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 54.595001, "t": 407.15253000000007, "r": 286.35989, "b": 437.08646000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9330756664276123, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 415.1684900000001, "r_x1": 65.334427, "r_y1": 415.1684900000001, "r_x2": 65.334427, "r_y2": 407.15253000000007, "r_x3": 54.595001, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.637054, "r_y0": 415.1684900000001, "r_x1": 286.35852, "r_y1": 415.1684900000001, "r_x2": 286.35852, "r_y2": 407.15253000000007, "r_x3": 67.637054, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 426.12747, "r_x1": 147.13306, "r_y1": 426.12747, "r_x2": 147.13306, "r_y2": 418.11151, "r_x3": 70.030998, "r_y3": 418.11151, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15601, "r_y0": 425.92126, "r_x1": 286.35989, "r_y1": 425.92126, "r_x2": 286.35989, "r_y2": 418.1922, "r_x3": 149.15601, "r_y3": 418.1922, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.88025, "r_x1": 213.48445, "r_y1": 436.88025, "r_x2": 213.48445, "r_y2": 429.15118, "r_x3": 70.031006, "r_y3": 429.15118, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.483, "r_y0": 437.08646000000005, "r_x1": 261.04083, "r_y1": 437.08646000000005, "r_x2": 261.04083, "r_y2": 429.07050000000004, "r_x3": 213.483, "r_y3": 429.07050000000004, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1" }, { "label": "list_item", "id": 14, "page_no": 8, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 50.112, "t": 440.3424999999999, "r": 286.36334, "b": 481.23544, "coord_origin": "TOPLEFT" }, "confidence": 0.9274735450744629, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 448.3584599999999, "r_x1": 65.399307, "r_y1": 448.3584599999999, "r_x2": 65.399307, "r_y2": 440.3424999999999, "r_x3": 50.112, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693321, "r_y0": 448.3584599999999, "r_x1": 286.3587, "r_y1": 448.3584599999999, "r_x2": 286.3587, "r_y2": 440.3424999999999, "r_x3": 67.693321, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 459.31747, "r_x1": 202.74268, "r_y1": 459.31747, "r_x2": 202.74268, "r_y2": 451.30151, "r_x3": 70.030998, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.00122, "r_y0": 459.31747, "r_x1": 286.36331, "r_y1": 459.31747, "r_x2": 286.36331, "r_y2": 451.30151, "r_x3": 209.00122, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 470.27646, "r_x1": 286.36334, "r_y1": 470.27646, "r_x2": 286.36334, "r_y2": 462.2605, "r_x3": 70.030998, "r_y3": 462.2605, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 481.23544, "r_x1": 141.86981, "r_y1": 481.23544, "r_x2": 141.86981, "r_y2": 473.21948, "r_x3": 70.030998, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.097, "r_y0": 481.02924, "r_x1": 166.01561, "r_y1": 481.02924, "r_x2": 166.01561, "r_y2": 473.30017, "r_x3": 145.097, "r_y3": 473.30017, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.015, "r_y0": 481.23544, "r_x1": 259.90216, "r_y1": 481.23544, "r_x2": 259.90216, "r_y2": 473.21948, "r_x3": 166.015, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2" }, { "label": "list_item", "id": 11, "page_no": 8, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.112, "t": 484.49048, "r": 286.36331, "b": 536.34238, "coord_origin": "TOPLEFT" }, "confidence": 0.9299950003623962, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.50644, "r_x1": 66.033806, "r_y1": 492.50644, "r_x2": 66.033806, "r_y2": 484.49048, "r_x3": 50.112, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.423035, "r_y0": 492.50644, "r_x1": 286.35873, "r_y1": 492.50644, "r_x2": 286.35873, "r_y2": 484.49048, "r_x3": 68.423035, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 503.46542, "r_x1": 286.36331, "r_y1": 503.46542, "r_x2": 286.36331, "r_y2": 495.44946, "r_x3": 70.030998, "r_y3": 495.44946, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 514.2182, "r_x1": 227.40926, "r_y1": 514.2182, "r_x2": 227.40926, "r_y2": 506.48914, "r_x3": 70.030998, "r_y3": 506.48914, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.40500000000003, "r_y0": 514.4244100000001, "r_x1": 286.35913, "r_y1": 514.4244100000001, "r_x2": 286.35913, "r_y2": 506.40845, "r_x3": 227.40500000000003, "r_y3": 506.40845, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 525.38339, "r_x1": 286.36328, "r_y1": 525.38339, "r_x2": 286.36328, "r_y2": 517.36743, "r_x3": 70.031006, "r_y3": 517.36743, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 536.34238, "r_x1": 112.36138000000001, "r_y1": 536.34238, "r_x2": 112.36138000000001, "r_y2": 528.32642, "r_x3": 70.031006, "r_y3": 528.32642, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2" }, { "label": "list_item", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.112007, "t": 539.59842, "r": 286.36334, "b": 591.44937, "coord_origin": "TOPLEFT" }, "confidence": 0.9394103288650513, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 547.61438, "r_x1": 65.466705, "r_y1": 547.61438, "r_x2": 65.466705, "r_y2": 539.59842, "r_x3": 50.112007, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.770828, "r_y0": 547.61438, "r_x1": 286.35873, "r_y1": 547.61438, "r_x2": 286.35873, "r_y2": 539.59842, "r_x3": 67.770828, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 558.57338, "r_x1": 136.28374, "r_y1": 558.57338, "r_x2": 136.28374, "r_y2": 550.55742, "r_x3": 70.031006, "r_y3": 550.55742, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.811, "r_y0": 558.36716, "r_x1": 286.36206, "r_y1": 558.36716, "r_x2": 286.36206, "r_y2": 550.63812, "r_x3": 138.811, "r_y3": 550.63812, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 569.32616, "r_x1": 286.36334, "r_y1": 569.32616, "r_x2": 286.36334, "r_y2": 561.5971199999999, "r_x3": 70.031006, "r_y3": 561.5971199999999, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 580.28516, "r_x1": 74.514206, "r_y1": 580.28516, "r_x2": 74.514206, "r_y2": 572.55612, "r_x3": 70.031006, "r_y3": 572.55612, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.514008, "r_y0": 580.4913799999999, "r_x1": 286.36313, "r_y1": 580.4913799999999, "r_x2": 286.36313, "r_y2": 572.47542, "r_x3": 74.514008, "r_y3": 572.47542, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 591.44937, "r_x1": 90.357834, "r_y1": 591.44937, "r_x2": 90.357834, "r_y2": 583.4334100000001, "r_x3": 70.031006, "r_y3": 583.4334100000001, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2" }, { "label": "list_item", "id": 13, "page_no": 8, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.112007, "t": 594.70541, "r": 286.36331, "b": 646.55737, "coord_origin": "TOPLEFT" }, "confidence": 0.9298838973045349, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 602.72137, "r_x1": 66.270439, "r_y1": 602.72137, "r_x2": 66.270439, "r_y2": 594.70541, "r_x3": 50.112007, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.695168, "r_y0": 602.72137, "r_x1": 286.35873, "r_y1": 602.72137, "r_x2": 286.35873, "r_y2": 594.70541, "r_x3": 68.695168, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 613.68037, "r_x1": 286.3631, "r_y1": 613.68037, "r_x2": 286.3631, "r_y2": 605.66441, "r_x3": 70.031006, "r_y3": 605.66441, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 624.63937, "r_x1": 286.36331, "r_y1": 624.63937, "r_x2": 286.36331, "r_y2": 616.62341, "r_x3": 70.031006, "r_y3": 616.62341, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 635.5983699999999, "r_x1": 77.500015, "r_y1": 635.5983699999999, "r_x2": 77.500015, "r_y2": 627.58241, "r_x3": 70.031006, "r_y3": 627.58241, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.920006, "r_y0": 635.39215, "r_x1": 286.3624, "r_y1": 635.39215, "r_x2": 286.3624, "r_y2": 627.6631199999999, "r_x3": 79.920006, "r_y3": 627.6631199999999, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 646.35115, "r_x1": 140.67728, "r_y1": 646.35115, "r_x2": 140.67728, "r_y2": 638.62212, "r_x3": 70.031006, "r_y3": 638.62212, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.67599, "r_y0": 646.55737, "r_x1": 264.43921, "r_y1": 646.55737, "r_x2": 264.43921, "r_y2": 638.54141, "r_x3": 140.67599, "r_y3": 638.54141, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2" }, { "label": "list_item", "id": 17, "page_no": 8, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 50.111992, "t": 649.81342, "r": 286.36334, "b": 679.74638, "coord_origin": "TOPLEFT" }, "confidence": 0.9115257263183594, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 657.82938, "r_x1": 66.534035, "r_y1": 657.82938, "r_x2": 66.534035, "r_y2": 649.81342, "r_x3": 50.111992, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.998329, "r_y0": 657.82938, "r_x1": 286.35873, "r_y1": 657.82938, "r_x2": 286.35873, "r_y2": 649.81342, "r_x3": 68.998329, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 668.78738, "r_x1": 93.200165, "r_y1": 668.78738, "r_x2": 93.200165, "r_y2": 660.77142, "r_x3": 70.030991, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.20243, "r_y0": 668.78738, "r_x1": 286.36334, "r_y1": 668.78738, "r_x2": 286.36334, "r_y2": 660.77142, "r_x3": 102.20243, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 679.74638, "r_x1": 171.9969, "r_y1": 679.74638, "r_x2": 171.9969, "r_y2": 671.73042, "r_x3": 70.030991, "r_y3": 671.73042, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2" }, { "label": "list_item", "id": 16, "page_no": 8, "cluster": { "id": 16, "label": "list_item", "bbox": { "l": 50.111992, "t": 683.00243, "r": 286.35931, "b": 712.936386, "coord_origin": "TOPLEFT" }, "confidence": 0.912230372428894, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 691.01839, "r_x1": 65.515968, "r_y1": 691.01839, "r_x2": 65.515968, "r_y2": 683.00243, "r_x3": 50.111992, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.827499, "r_y0": 691.01839, "r_x1": 286.3587, "r_y1": 691.01839, "r_x2": 286.3587, "r_y2": 683.00243, "r_x3": 67.827499, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 701.977386, "r_x1": 102.15761, "r_y1": 701.977386, "r_x2": 102.15761, "r_y2": 693.9614260000001, "r_x3": 70.030991, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.54999, "r_y0": 701.771156, "r_x1": 231.47461, "r_y1": 701.771156, "r_x2": 231.47461, "r_y2": 694.0421220000001, "r_x3": 107.54999, "r_y3": 694.0421220000001, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.47598, "r_y0": 701.977386, "r_x1": 286.35931, "r_y1": 701.977386, "r_x2": 286.35931, "r_y2": 693.9614260000001, "r_x3": 231.47598, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 712.936386, "r_x1": 97.916481, "r_y1": 712.936386, "r_x2": 97.916481, "r_y2": 704.920425, "r_x3": 70.030975, "r_y3": 704.920425, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6" }, { "label": "list_item", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86197, "t": 75.88342000000011, "r": 545.11475, "b": 138.69335999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9389600157737732, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 83.89940999999999, "r_x1": 324.74973, "r_y1": 83.89940999999999, "r_x2": 324.74973, "r_y2": 75.88342000000011, "r_x3": 308.86197, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13382, "r_y0": 83.89940999999999, "r_x1": 545.1087, "r_y1": 83.89940999999999, "r_x2": 545.1087, "r_y2": 75.88342000000011, "r_x3": 327.13382, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 94.85741999999993, "r_x1": 545.1134, "r_y1": 94.85741999999993, "r_x2": 545.1134, "r_y2": 86.84142999999995, "r_x3": 328.78098, "r_y3": 86.84142999999995, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 105.81641000000002, "r_x1": 390.96295, "r_y1": 105.81641000000002, "r_x2": 390.96295, "r_y2": 97.80042000000003, "r_x3": 328.78098, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27008, "r_y0": 105.81641000000002, "r_x1": 435.1404099999999, "r_y1": 105.81641000000002, "r_x2": 435.1404099999999, "r_y2": 97.80042000000003, "r_x3": 400.27008, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71277, "r_y0": 105.81641000000002, "r_x1": 545.11328, "r_y1": 105.81641000000002, "r_x2": 545.11328, "r_y2": 97.80042000000003, "r_x3": 441.71277, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 116.7753899999999, "r_x1": 440.80719, "r_y1": 116.7753899999999, "r_x2": 440.80719, "r_y2": 108.75940000000003, "r_x3": 328.78098, "r_y3": 108.75940000000003, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63498, "r_y0": 116.56914999999992, "r_x1": 545.11304, "r_y1": 116.56914999999992, "r_x2": 545.11304, "r_y2": 108.84009000000003, "r_x3": 446.63498, "r_y3": 108.84009000000003, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 127.52814000000001, "r_x1": 471.13153, "r_y1": 127.52814000000001, "r_x2": 471.13153, "r_y2": 119.79907000000003, "r_x3": 328.78098, "r_y3": 119.79907000000003, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13300000000004, "r_y0": 127.73437999999999, "r_x1": 545.11475, "r_y1": 127.73437999999999, "r_x2": 545.11475, "r_y2": 119.71838000000002, "r_x3": 471.13300000000004, "r_y3": 119.71838000000002, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 138.69335999999998, "r_x1": 356.6665, "r_y1": 138.69335999999998, "r_x2": 356.6665, "r_y2": 130.67737, "r_x3": 328.78101, "r_y3": 130.67737, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4" }, { "label": "list_item", "id": 15, "page_no": 8, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.862, "t": 142.12334999999996, "r": 545.1134, "b": 172.05633999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9253129959106445, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 150.13933999999995, "r_x1": 325.24371, "r_y1": 150.13933999999995, "r_x2": 325.24371, "r_y2": 142.12334999999996, "r_x3": 308.862, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.70197, "r_y0": 150.13933999999995, "r_x1": 545.10883, "r_y1": 150.13933999999995, "r_x2": 545.10883, "r_y2": 142.12334999999996, "r_x3": 327.70197, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.09735, "r_x1": 414.44598, "r_y1": 161.09735, "r_x2": 414.44598, "r_y2": 153.08136000000002, "r_x3": 328.78101, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.82532, "r_y0": 161.09735, "r_x1": 545.1134, "r_y1": 161.09735, "r_x2": 545.1134, "r_y2": 153.08136000000002, "r_x3": 421.82532, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 172.05633999999998, "r_x1": 493.62835999999993, "r_y1": 172.05633999999998, "r_x2": 493.62835999999993, "r_y2": 164.04034000000001, "r_x3": 328.78101, "r_y3": 164.04034000000001, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3" }, { "label": "list_item", "id": 12, "page_no": 8, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 308.862, "t": 175.48632999999995, "r": 545.11353, "b": 260.21423000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9299732446670532, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.50232000000005, "r_x1": 324.26599, "r_y1": 183.50232000000005, "r_x2": 324.26599, "r_y2": 175.48632999999995, "r_x3": 308.862, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57751, "r_y0": 183.50232000000005, "r_x1": 545.10876, "r_y1": 183.50232000000005, "r_x2": 545.10876, "r_y2": 175.48632999999995, "r_x3": 326.57751, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 194.46130000000005, "r_x1": 545.11334, "r_y1": 194.46130000000005, "r_x2": 545.11334, "r_y2": 186.44530999999995, "r_x3": 328.78101, "r_y3": 186.44530999999995, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 205.42029000000002, "r_x1": 545.11346, "r_y1": 205.42029000000002, "r_x2": 545.11346, "r_y2": 197.40430000000003, "r_x3": 328.78101, "r_y3": 197.40430000000003, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 216.37927000000002, "r_x1": 545.11353, "r_y1": 216.37927000000002, "r_x2": 545.11353, "r_y2": 208.36328000000003, "r_x3": 328.78101, "r_y3": 208.36328000000003, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 227.33826, "r_x1": 479.26413, "r_y1": 227.33826, "r_x2": 479.26413, "r_y2": 219.32227, "r_x3": 328.78101, "r_y3": 219.32227, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 227.13202, "r_x1": 545.11273, "r_y1": 227.13202, "r_x2": 545.11273, "r_y2": 219.40295000000003, "r_x3": 483.11902, "r_y3": 219.40295000000003, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 238.09002999999996, "r_x1": 519.39771, "r_y1": 238.09002999999996, "r_x2": 519.39771, "r_y2": 230.36095999999998, "r_x3": 328.78101, "r_y3": 230.36095999999998, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.401, "r_y0": 238.29625999999996, "r_x1": 545.10767, "r_y1": 238.29625999999996, "r_x2": 545.10767, "r_y2": 230.28026999999997, "r_x3": 519.401, "r_y3": 230.28026999999997, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 249.25525000000005, "r_x1": 545.11328, "r_y1": 249.25525000000005, "r_x2": 545.11328, "r_y2": 241.23925999999994, "r_x3": 328.78101, "r_y3": 241.23925999999994, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 260.21423000000004, "r_x1": 333.26422, "r_y1": 260.21423000000004, "r_x2": 333.26422, "r_y2": 252.19824000000006, "r_x3": 328.78101, "r_y3": 252.19824000000006, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 308.862, "t": 263.64423, "r": 545.1142, "b": 326.45413, "coord_origin": "TOPLEFT" }, "confidence": 0.937321662902832, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 271.66022, "r_x1": 324.26477, "r_y1": 271.66022, "r_x2": 324.26477, "r_y2": 263.64423, "r_x3": 308.862, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57611, "r_y0": 271.66022, "r_x1": 545.10883, "r_y1": 271.66022, "r_x2": 545.10883, "r_y2": 263.64423, "r_x3": 326.57611, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 282.61917000000005, "r_x1": 545.1134, "r_y1": 282.61917000000005, "r_x2": 545.1134, "r_y2": 274.60321, "r_x3": 328.78101, "r_y3": 274.60321, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 293.57816, "r_x1": 545.11328, "r_y1": 293.57816, "r_x2": 545.11328, "r_y2": 285.56219, "r_x3": 328.78101, "r_y3": 285.56219, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 304.53714, "r_x1": 545.11334, "r_y1": 304.53714, "r_x2": 545.11334, "r_y2": 296.52118, "r_x3": 328.78101, "r_y3": 296.52118, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 315.49515, "r_x1": 352.84683, "r_y1": 315.49515, "r_x2": 352.84683, "r_y2": 307.47919, "r_x3": 328.78101, "r_y3": 307.47919, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.23599, "r_y0": 315.28894, "r_x1": 545.1142, "r_y1": 315.28894, "r_x2": 545.1142, "r_y2": 307.55988, "r_x3": 360.23599, "r_y3": 307.55988, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 326.24792, "r_x1": 371.02173, "r_y1": 326.24792, "r_x2": 371.02173, "r_y2": 318.51886, "r_x3": 328.78101, "r_y3": 318.51886, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.021, "r_y0": 326.45413, "r_x1": 502.26227, "r_y1": 326.45413, "r_x2": 502.26227, "r_y2": 318.43817, "r_x3": 371.021, "r_y3": 318.43817, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1" }, { "label": "list_item", "id": 18, "page_no": 8, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.862, "t": 329.88419, "r": 545.11609, "b": 370.77713, "coord_origin": "TOPLEFT" }, "confidence": 0.9027292728424072, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.90015, "r_x1": 323.82672, "r_y1": 337.90015, "r_x2": 323.82672, "r_y2": 329.88419, "r_x3": 308.862, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07233, "r_y0": 337.90015, "r_x1": 545.10876, "r_y1": 337.90015, "r_x2": 545.10876, "r_y2": 329.88419, "r_x3": 326.07233, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 348.85916, "r_x1": 545.11346, "r_y1": 348.85916, "r_x2": 545.11346, "r_y2": 340.8432, "r_x3": 328.78101, "r_y3": 340.8432, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 359.81815000000006, "r_x1": 382.7767, "r_y1": 359.81815000000006, "r_x2": 382.7767, "r_y2": 351.80219000000005, "r_x3": 328.78101, "r_y3": 351.80219000000005, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54102, "r_y0": 359.61194, "r_x1": 545.11609, "r_y1": 359.61194, "r_x2": 545.11609, "r_y2": 351.88287, "r_x3": 385.54102, "r_y3": 351.88287, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 370.57092, "r_x1": 443.59579, "r_y1": 370.57092, "r_x2": 443.59579, "r_y2": 362.84186, "r_x3": 328.78101, "r_y3": 362.84186, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59399, "r_y0": 370.77713, "r_x1": 534.48645, "r_y1": 370.77713, "r_x2": 534.48645, "r_y2": 362.76117, "r_x3": 443.59399, "r_y3": 362.76117, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2" }, { "label": "list_item", "id": 21, "page_no": 8, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.862, "t": 374.20618, "r": 545.11346, "b": 437.01706, "coord_origin": "TOPLEFT" }, "confidence": 0.882714569568634, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 382.22214, "r_x1": 324.60281, "r_y1": 382.22214, "r_x2": 324.60281, "r_y2": 374.20618, "r_x3": 308.862, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96487, "r_y0": 382.22214, "r_x1": 362.6604, "r_y1": 382.22214, "r_x2": 362.6604, "r_y2": 374.20618, "r_x3": 326.96487, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69479, "r_y0": 382.22214, "r_x1": 389.6134, "r_y1": 382.22214, "r_x2": 389.6134, "r_y2": 374.20618, "r_x3": 368.69479, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.6478, "r_y0": 382.22214, "r_x1": 424.56445, "r_y1": 382.22214, "r_x2": 424.56445, "r_y2": 374.20618, "r_x3": 395.6478, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.5492899999999, "r_y0": 382.22214, "r_x1": 438.0230399999999, "r_y1": 382.22214, "r_x2": 438.0230399999999, "r_y2": 374.20618, "r_x3": 431.5492899999999, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.05743, "r_y0": 382.22214, "r_x1": 488.5038799999999, "r_y1": 382.22214, "r_x2": 488.5038799999999, "r_y2": 374.20618, "r_x3": 444.05743, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.47974, "r_y0": 382.22214, "r_x1": 515.41205, "r_y1": 382.22214, "r_x2": 515.41205, "r_y2": 374.20618, "r_x3": 495.47974, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.44641, "r_y0": 382.22214, "r_x1": 545.10876, "r_y1": 382.22214, "r_x2": 545.10876, "r_y2": 374.20618, "r_x3": 521.44641, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 393.18112, "r_x1": 545.1134, "r_y1": 393.18112, "r_x2": 545.1134, "r_y2": 385.16516, "r_x3": 328.78101, "r_y3": 385.16516, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 404.14011, "r_x1": 545.11346, "r_y1": 404.14011, "r_x2": 545.11346, "r_y2": 396.12415, "r_x3": 328.78101, "r_y3": 396.12415, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 415.09909, "r_x1": 478.00881999999996, "r_y1": 415.09909, "r_x2": 478.00881999999996, "r_y2": 407.08313, "r_x3": 328.78101, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.0701, "r_y0": 415.09909, "r_x1": 491.53912, "r_y1": 415.09909, "r_x2": 491.53912, "r_y2": 407.08313, "r_x3": 484.0701, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.668, "r_y0": 414.89288, "r_x1": 545.11298, "r_y1": 414.89288, "r_x2": 545.11298, "r_y2": 407.16382, "r_x3": 494.668, "r_y3": 407.16382, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 425.85187, "r_x1": 545.11334, "r_y1": 425.85187, "r_x2": 545.11334, "r_y2": 418.12280000000004, "r_x3": 328.78101, "r_y3": 418.12280000000004, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 436.8108500000001, "r_x1": 360.83591, "r_y1": 436.8108500000001, "r_x2": 360.83591, "r_y2": 429.08179, "r_x3": 328.78101, "r_y3": 429.08179, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.836, "r_y0": 437.01706, "r_x1": 475.63287, "r_y1": 437.01706, "r_x2": 475.63287, "r_y2": 429.0011, "r_x3": 360.836, "r_y3": 429.0011, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1" }, { "label": "list_item", "id": 20, "page_no": 8, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 308.862, "t": 440.44611, "r": 545.11475, "b": 558.05096, "coord_origin": "TOPLEFT" }, "confidence": 0.8896440863609314, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.46207, "r_x1": 324.57407, "r_y1": 448.46207, "r_x2": 324.57407, "r_y2": 440.44611, "r_x3": 308.862, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93179, "r_y0": 448.46207, "r_x1": 545.1087, "r_y1": 448.46207, "r_x2": 545.1087, "r_y2": 440.44611, "r_x3": 326.93179, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 459.42105, "r_x1": 545.11346, "r_y1": 459.42105, "r_x2": 545.11346, "r_y2": 451.40509, "r_x3": 328.78101, "r_y3": 451.40509, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 470.38004, "r_x1": 545.11328, "r_y1": 470.38004, "r_x2": 545.11328, "r_y2": 462.36407, "r_x3": 328.78101, "r_y3": 462.36407, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 481.33902, "r_x1": 545.11328, "r_y1": 481.33902, "r_x2": 545.11328, "r_y2": 473.32306, "r_x3": 328.78101, "r_y3": 473.32306, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 492.298, "r_x1": 545.11328, "r_y1": 492.298, "r_x2": 545.11328, "r_y2": 484.28204, "r_x3": 328.78101, "r_y3": 484.28204, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 503.25699, "r_x1": 545.1134, "r_y1": 503.25699, "r_x2": 545.1134, "r_y2": 495.24103, "r_x3": 328.78101, "r_y3": 495.24103, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 514.21597, "r_x1": 545.1134, "r_y1": 514.21597, "r_x2": 545.1134, "r_y2": 506.20001, "r_x3": 328.78101, "r_y3": 506.20001, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 525.17496, "r_x1": 545.1098, "r_y1": 525.17496, "r_x2": 545.1098, "r_y2": 517.159, "r_x3": 328.78101, "r_y3": 517.159, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 536.13297, "r_x1": 434.56659, "r_y1": 536.13297, "r_x2": 434.56659, "r_y2": 528.117, "r_x3": 328.78101, "r_y3": 528.117, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86401, "r_y0": 535.9267600000001, "r_x1": 545.11115, "r_y1": 535.9267600000001, "r_x2": 545.11115, "r_y2": 528.19769, "r_x3": 437.86401, "r_y3": 528.19769, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 546.8857399999999, "r_x1": 425.73471, "r_y1": 546.8857399999999, "r_x2": 425.73471, "r_y2": 539.15671, "r_x3": 328.78101, "r_y3": 539.15671, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.73602, "r_y0": 547.09196, "r_x1": 545.11475, "r_y1": 547.09196, "r_x2": 545.11475, "r_y2": 539.076, "r_x3": 425.73602, "r_y3": 539.076, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 558.05096, "r_x1": 399.74109, "r_y1": 558.05096, "r_x2": 399.74109, "r_y2": 550.035, "r_x3": 328.78101, "r_y3": 550.035, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6" }, { "label": "list_item", "id": 19, "page_no": 8, "cluster": { "id": 19, "label": "list_item", "bbox": { "l": 308.862, "t": 561.481, "r": 545.1134, "b": 624.29097, "coord_origin": "TOPLEFT" }, "confidence": 0.9025435447692871, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.49696, "r_x1": 324.50351, "r_y1": 569.49696, "r_x2": 324.50351, "r_y2": 561.481, "r_x3": 308.862, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85068, "r_y0": 569.49696, "r_x1": 545.10876, "r_y1": 569.49696, "r_x2": 545.10876, "r_y2": 561.481, "r_x3": 326.85068, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 580.45596, "r_x1": 545.1134, "r_y1": 580.45596, "r_x2": 545.1134, "r_y2": 572.44, "r_x3": 328.78101, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 591.4149600000001, "r_x1": 545.11334, "r_y1": 591.4149600000001, "r_x2": 545.11334, "r_y2": 583.399, "r_x3": 328.78101, "r_y3": 583.399, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 602.37396, "r_x1": 431.61667, "r_y1": 602.37396, "r_x2": 431.61667, "r_y2": 594.358, "r_x3": 328.78101, "r_y3": 594.358, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69101000000006, "r_y0": 602.16774, "r_x1": 545.11224, "r_y1": 602.16774, "r_x2": 545.11224, "r_y2": 594.4387099999999, "r_x3": 434.69101000000006, "r_y3": 594.4387099999999, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 613.12575, "r_x1": 545.1134, "r_y1": 613.12575, "r_x2": 545.1134, "r_y2": 605.39671, "r_x3": 328.78101, "r_y3": 605.39671, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 624.08475, "r_x1": 367.8028, "r_y1": 624.08475, "r_x2": 367.8028, "r_y2": 616.35571, "r_x3": 328.78101, "r_y3": 616.35571, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.802, "r_y0": 624.29097, "r_x1": 458.69446000000005, "r_y1": 624.29097, "r_x2": 458.69446000000005, "r_y2": 616.2750100000001, "r_x3": 367.802, "r_y3": 616.2750100000001, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1" }, { "label": "list_item", "id": 23, "page_no": 8, "cluster": { "id": 23, "label": "list_item", "bbox": { "l": 308.862, "t": 627.72101, "r": 545.11621, "b": 668.61398, "coord_origin": "TOPLEFT" }, "confidence": 0.8777532577514648, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 635.73697, "r_x1": 324.69476, "r_y1": 635.73697, "r_x2": 324.69476, "r_y2": 627.72101, "r_x3": 308.862, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07065, "r_y0": 635.73697, "r_x1": 545.1087, "r_y1": 635.73697, "r_x2": 545.1087, "r_y2": 627.72101, "r_x3": 327.07065, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 646.69597, "r_x1": 545.11328, "r_y1": 646.69597, "r_x2": 545.11328, "r_y2": 638.68001, "r_x3": 328.78101, "r_y3": 638.68001, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 657.65497, "r_x1": 336.25003, "r_y1": 657.65497, "r_x2": 336.25003, "r_y2": 649.63901, "r_x3": 328.78101, "r_y3": 649.63901, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.10001, "r_y0": 657.44875, "r_x1": 545.11621, "r_y1": 657.44875, "r_x2": 545.11621, "r_y2": 649.71971, "r_x3": 338.10001, "r_y3": 649.71971, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 668.40775, "r_x1": 406.32245, "r_y1": 668.40775, "r_x2": 406.32245, "r_y2": 660.67871, "r_x3": 328.78101, "r_y3": 660.67871, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 668.61398, "r_x1": 521.1189, "r_y1": 668.61398, "r_x2": 521.1189, "r_y2": 660.5980099999999, "r_x3": 406.32202, "r_y3": 660.5980099999999, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3" }, { "label": "list_item", "id": 24, "page_no": 8, "cluster": { "id": 24, "label": "list_item", "bbox": { "l": 308.86203, "t": 672.04301, "r": 545.1134, "b": 712.935974, "coord_origin": "TOPLEFT" }, "confidence": 0.8654531240463257, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 680.05898, "r_x1": 324.71329, "r_y1": 680.05898, "r_x2": 324.71329, "r_y2": 672.04301, "r_x3": 308.86203, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09195, "r_y0": 680.05898, "r_x1": 545.10876, "r_y1": 680.05898, "r_x2": 545.10876, "r_y2": 672.04301, "r_x3": 327.09195, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 691.01797, "r_x1": 482.81488, "r_y1": 691.01797, "r_x2": 482.81488, "r_y2": 683.0020099999999, "r_x3": 328.78104, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75064, "r_y0": 691.01797, "r_x1": 545.1134, "r_y1": 691.01797, "r_x2": 545.1134, "r_y2": 683.0020099999999, "r_x3": 488.75064, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 701.976974, "r_x1": 545.11334, "r_y1": 701.976974, "r_x2": 545.11334, "r_y2": 693.961014, "r_x3": 328.78104, "r_y3": 693.961014, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 712.935974, "r_x1": 379.1543, "r_y1": 712.935974, "r_x2": 379.1543, "r_y2": 704.920013, "r_x3": 328.78104, "r_y3": 704.920013, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.61603, "r_y0": 712.729744, "r_x1": 545.10938, "r_y1": 712.729744, "r_x2": 545.10938, "r_y2": 705.00071, "r_x3": 381.61603, "r_y3": 705.00071, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on" }, { "label": "page_footer", "id": 22, "page_no": 8, "cluster": { "id": 22, "label": "page_footer", "bbox": { "l": 295.12103, "t": 734.1325870000001, "r": 300.10233, "b": 743.0391500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.8797808885574341, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.0391500000001, "r_x1": 300.10233, "r_y1": 743.0391500000001, "r_x2": 300.10233, "r_y2": 734.1325870000001, "r_x3": 295.12103, "r_y3": 734.1325870000001, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" } ], "body": [ { "label": "list_item", "id": 25, "page_no": 8, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 70.030998, "t": 75.88378999999998, "r": 286.36334, "b": 116.77575999999999, "coord_origin": "TOPLEFT" }, "confidence": 0.7310384511947632, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.89977999999996, "r_x1": 286.36334, "r_y1": 83.89977999999996, "r_x2": 286.36334, "r_y2": 75.88378999999998, "r_x3": 70.030998, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 94.85875999999996, "r_x1": 286.36331, "r_y1": 94.85875999999996, "r_x2": 286.36331, "r_y2": 86.84276999999997, "r_x3": 70.030998, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 105.81677000000002, "r_x1": 85.722198, "r_y1": 105.81677000000002, "r_x2": 85.722198, "r_y2": 97.80078000000003, "r_x3": 70.030998, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.889, "r_y0": 105.61053000000004, "r_x1": 199.93315, "r_y1": 105.61053000000004, "r_x2": 199.93315, "r_y2": 97.88147000000004, "r_x3": 87.889, "r_y3": 97.88147000000004, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.936, "r_y0": 105.81677000000002, "r_x1": 286.36313, "r_y1": 105.81677000000002, "r_x2": 286.36313, "r_y2": 97.80078000000003, "r_x3": 199.936, "r_y3": 97.80078000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 116.77575999999999, "r_x1": 221.94871999999998, "r_y1": 116.77575999999999, "r_x2": 221.94871999999998, "r_y2": 108.75977, "r_x3": 70.031006, "r_y3": 108.75977, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5" }, { "label": "list_item", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 54.595005, "t": 120.03174000000013, "r": 286.36334, "b": 149.96569999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9372755885124207, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595005, "r_y0": 128.04773, "r_x1": 65.206657, "r_y1": 128.04773, "r_x2": 65.206657, "r_y2": 120.03174000000013, "r_x3": 54.595005, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.481873, "r_y0": 128.04773, "r_x1": 286.35852, "r_y1": 128.04773, "r_x2": 286.35852, "r_y2": 120.03174000000013, "r_x3": 67.481873, "r_y3": 120.03174000000013, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.00671, "r_x1": 179.67215, "r_y1": 139.00671, "r_x2": 179.67215, "r_y2": 130.99072, "r_x3": 70.031006, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58101, "r_y0": 139.00671, "r_x1": 286.36334, "r_y1": 139.00671, "r_x2": 286.36334, "r_y2": 130.99072, "r_x3": 185.58101, "r_y3": 130.99072, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.96569999999997, "r_x1": 113.11456, "r_y1": 149.96569999999997, "r_x2": 113.11456, "r_y2": 141.94970999999998, "r_x3": 70.031006, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34200999999999, "r_y0": 149.75946, "r_x1": 235.3082, "r_y1": 149.75946, "r_x2": 235.3082, "r_y2": 142.0304, "r_x3": 116.34200999999999, "r_y3": 142.0304, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.30701, "r_y0": 149.96569999999997, "r_x1": 267.67572, "r_y1": 149.96569999999997, "r_x2": 267.67572, "r_y2": 141.94970999999998, "r_x3": 235.30701, "r_y3": 141.94970999999998, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3" }, { "label": "list_item", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 54.595001, "t": 153.22168, "r": 286.36301, "b": 183.15466000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9378374218940735, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 161.23766999999998, "r_x1": 65.103195, "r_y1": 161.23766999999998, "r_x2": 65.103195, "r_y2": 153.22168, "r_x3": 54.595001, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.356239, "r_y0": 161.23766999999998, "r_x1": 218.77876, "r_y1": 161.23766999999998, "r_x2": 218.77876, "r_y2": 153.22168, "r_x3": 67.356239, "r_y3": 153.22168, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.97999999999996, "r_y0": 161.03143, "r_x1": 286.36301, "r_y1": 161.03143, "r_x2": 286.36301, "r_y2": 153.30237, "r_x3": 220.97999999999996, "r_y3": 153.30237, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 171.99041999999997, "r_x1": 125.26401000000001, "r_y1": 171.99041999999997, "r_x2": 125.26401000000001, "r_y2": 164.26135, "r_x3": 70.030991, "r_y3": 164.26135, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26098999999999, "r_y0": 172.19665999999995, "r_x1": 286.36029, "r_y1": 172.19665999999995, "r_x2": 286.36029, "r_y2": 164.18066, "r_x3": 125.26098999999999, "r_y3": 164.18066, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 183.15466000000004, "r_x1": 97.916496, "r_y1": 183.15466000000004, "r_x2": 97.916496, "r_y2": 175.13867000000005, "r_x3": 70.030991, "r_y3": 175.13867000000005, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2" }, { "label": "list_item", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 54.59499, "t": 186.41063999999994, "r": 286.36401, "b": 227.30358999999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9648825526237488, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 194.42664000000002, "r_x1": 65.806984, "r_y1": 194.42664000000002, "r_x2": 65.806984, "r_y2": 186.41063999999994, "r_x3": 54.59499, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.210922, "r_y0": 194.42664000000002, "r_x1": 286.36401, "r_y1": 194.42664000000002, "r_x2": 286.36401, "r_y2": 186.41063999999994, "r_x3": 68.210922, "r_y3": 186.41063999999994, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 205.38562000000002, "r_x1": 286.36331, "r_y1": 205.38562000000002, "r_x2": 286.36331, "r_y2": 197.36963000000003, "r_x3": 70.030983, "r_y3": 197.36963000000003, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 216.3446, "r_x1": 286.36334, "r_y1": 216.3446, "r_x2": 286.36334, "r_y2": 208.32861000000003, "r_x3": 70.030983, "r_y3": 208.32861000000003, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 227.30358999999999, "r_x1": 245.83519, "r_y1": 227.30358999999999, "r_x2": 245.83519, "r_y2": 219.2876, "r_x3": 70.030983, "r_y3": 219.2876, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2" }, { "label": "list_item", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 54.594982, "t": 230.55957, "r": 286.36334, "b": 271.45154, "coord_origin": "TOPLEFT" }, "confidence": 0.9620943069458008, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594982, "r_y0": 238.57556, "r_x1": 65.381134, "r_y1": 238.57556, "r_x2": 65.381134, "r_y2": 230.55957, "r_x3": 54.594982, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693779, "r_y0": 238.57556, "r_x1": 286.35849, "r_y1": 238.57556, "r_x2": 286.35849, "r_y2": 230.55957, "r_x3": 67.693779, "r_y3": 230.55957, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 249.53454999999997, "r_x1": 286.36334, "r_y1": 249.53454999999997, "r_x2": 286.36334, "r_y2": 241.51855, "r_x3": 70.030983, "r_y3": 241.51855, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 260.49255000000005, "r_x1": 108.39821, "r_y1": 260.49255000000005, "r_x2": 108.39821, "r_y2": 252.47655999999995, "r_x3": 70.030983, "r_y3": 252.47655999999995, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64498000000002, "r_y0": 260.28632000000005, "r_x1": 286.3595, "r_y1": 260.28632000000005, "r_x2": 286.3595, "r_y2": 252.55724999999995, "r_x3": 110.64498000000002, "r_y3": 252.55724999999995, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 271.24530000000004, "r_x1": 140.57861, "r_y1": 271.24530000000004, "r_x2": 140.57861, "r_y2": 263.51624000000004, "r_x3": 70.030983, "r_y3": 263.51624000000004, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.57797, "r_y0": 271.45154, "r_x1": 266.47522, "r_y1": 271.45154, "r_x2": 266.47522, "r_y2": 263.43555000000003, "r_x3": 140.57797, "r_y3": 263.43555000000003, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2" }, { "label": "list_item", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 54.594971, "t": 274.70758, "r": 286.36676, "b": 315.6004899999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9555517435073853, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594971, "r_y0": 282.72351, "r_x1": 64.848648, "r_y1": 282.72351, "r_x2": 64.848648, "r_y2": 274.70758, "r_x3": 54.594971, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.047119, "r_y0": 282.72351, "r_x1": 286.36676, "r_y1": 282.72351, "r_x2": 286.36676, "r_y2": 274.70758, "r_x3": 67.047119, "r_y3": 274.70758, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 293.68253, "r_x1": 179.57349, "r_y1": 293.68253, "r_x2": 179.57349, "r_y2": 285.66655999999995, "r_x3": 70.030975, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.01559, "r_y0": 293.68253, "r_x1": 194.4846, "r_y1": 293.68253, "r_x2": 194.4846, "r_y2": 285.66655999999995, "r_x3": 187.01559, "r_y3": 285.66655999999995, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04398, "r_y0": 293.47632, "r_x1": 286.36304, "r_y1": 293.47632, "r_x2": 286.36304, "r_y2": 285.74725, "r_x3": 198.04398, "r_y3": 285.74725, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 304.43530000000004, "r_x1": 260.19937, "r_y1": 304.43530000000004, "r_x2": 260.19937, "r_y2": 296.70624, "r_x3": 70.030975, "r_y3": 296.70624, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.198, "r_y0": 304.64151, "r_x1": 286.36197, "r_y1": 304.64151, "r_x2": 286.36197, "r_y2": 296.62555, "r_x3": 260.198, "r_y3": 296.62555, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 315.6004899999999, "r_x1": 142.74849, "r_y1": 315.6004899999999, "r_x2": 142.74849, "r_y2": 307.5845299999999, "r_x3": 70.030991, "r_y3": 307.5845299999999, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2" }, { "label": "list_item", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 54.59499, "t": 318.85654, "r": 286.36319, "b": 348.78952, "coord_origin": "TOPLEFT" }, "confidence": 0.9479843378067017, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59499, "r_y0": 326.8725, "r_x1": 65.61586, "r_y1": 326.8725, "r_x2": 65.61586, "r_y2": 318.85654, "r_x3": 54.59499, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.978821, "r_y0": 326.8725, "r_x1": 199.492, "r_y1": 326.8725, "r_x2": 199.492, "r_y2": 318.85654, "r_x3": 67.978821, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.98792, "r_y0": 326.8725, "r_x1": 286.35849, "r_y1": 326.8725, "r_x2": 286.35849, "r_y2": 318.85654, "r_x3": 206.98792, "r_y3": 318.85654, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 337.83051, "r_x1": 176.28284, "r_y1": 337.83051, "r_x2": 176.28284, "r_y2": 329.8145400000001, "r_x3": 70.030991, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.60416, "r_y0": 337.83051, "r_x1": 190.07317, "r_y1": 337.83051, "r_x2": 190.07317, "r_y2": 329.8145400000001, "r_x3": 182.60416, "r_y3": 329.8145400000001, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28299, "r_y0": 337.62429999999995, "r_x1": 286.36319, "r_y1": 337.62429999999995, "r_x2": 286.36319, "r_y2": 329.89522999999997, "r_x3": 193.28299, "r_y3": 329.89522999999997, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 348.58331, "r_x1": 206.34717, "r_y1": 348.58331, "r_x2": 206.34717, "r_y2": 340.85425, "r_x3": 70.030991, "r_y3": 340.85425, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.34599, "r_y0": 348.78952, "r_x1": 274.82239, "r_y1": 348.78952, "r_x2": 274.82239, "r_y2": 340.77356, "r_x3": 206.34599, "r_y3": 340.77356, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2" }, { "label": "list_item", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 54.594986000000006, "t": 352.0455600000001, "r": 286.36331, "b": 403.89749, "coord_origin": "TOPLEFT" }, "confidence": 0.9484425187110901, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.594986000000006, "r_y0": 360.06152, "r_x1": 65.04657, "r_y1": 360.06152, "r_x2": 65.04657, "r_y2": 352.0455600000001, "r_x3": 54.594986000000006, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.287483, "r_y0": 360.06152, "r_x1": 286.35849, "r_y1": 360.06152, "r_x2": 286.35849, "r_y2": 352.0455600000001, "r_x3": 67.287483, "r_y3": 352.0455600000001, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 371.02054, "r_x1": 234.12507999999997, "r_y1": 371.02054, "r_x2": 234.12507999999997, "r_y2": 363.00458, "r_x3": 70.030983, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05186, "r_y0": 371.02054, "r_x1": 286.36331, "r_y1": 371.02054, "r_x2": 286.36331, "r_y2": 363.00458, "r_x3": 240.05186, "r_y3": 363.00458, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 381.97952, "r_x1": 286.36331, "r_y1": 381.97952, "r_x2": 286.36331, "r_y2": 373.96356, "r_x3": 70.030983, "r_y3": 373.96356, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 392.93851, "r_x1": 286.36331, "r_y1": 392.93851, "r_x2": 286.36331, "r_y2": 384.92255, "r_x3": 70.030983, "r_y3": 384.92255, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030983, "r_y0": 403.89749, "r_x1": 114.57605, "r_y1": 403.89749, "r_x2": 114.57605, "r_y2": 395.88153, "r_x3": 70.030983, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.80399000000001, "r_y0": 403.69128, "r_x1": 186.7287, "r_y1": 403.69128, "r_x2": 186.7287, "r_y2": 395.96222, "r_x3": 117.80399000000001, "r_y3": 395.96222, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.728, "r_y0": 403.89749, "r_x1": 243.00113999999996, "r_y1": 403.89749, "r_x2": 243.00113999999996, "r_y2": 395.88153, "r_x3": 186.728, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1" }, { "label": "list_item", "id": 10, "page_no": 8, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 54.595001, "t": 407.15253000000007, "r": 286.35989, "b": 437.08646000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9330756664276123, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.595001, "r_y0": 415.1684900000001, "r_x1": 65.334427, "r_y1": 415.1684900000001, "r_x2": 65.334427, "r_y2": 407.15253000000007, "r_x3": 54.595001, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.637054, "r_y0": 415.1684900000001, "r_x1": 286.35852, "r_y1": 415.1684900000001, "r_x2": 286.35852, "r_y2": 407.15253000000007, "r_x3": 67.637054, "r_y3": 407.15253000000007, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 426.12747, "r_x1": 147.13306, "r_y1": 426.12747, "r_x2": 147.13306, "r_y2": 418.11151, "r_x3": 70.030998, "r_y3": 418.11151, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15601, "r_y0": 425.92126, "r_x1": 286.35989, "r_y1": 425.92126, "r_x2": 286.35989, "r_y2": 418.1922, "r_x3": 149.15601, "r_y3": 418.1922, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.88025, "r_x1": 213.48445, "r_y1": 436.88025, "r_x2": 213.48445, "r_y2": 429.15118, "r_x3": 70.031006, "r_y3": 429.15118, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.483, "r_y0": 437.08646000000005, "r_x1": 261.04083, "r_y1": 437.08646000000005, "r_x2": 261.04083, "r_y2": 429.07050000000004, "r_x3": 213.483, "r_y3": 429.07050000000004, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1" }, { "label": "list_item", "id": 14, "page_no": 8, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 50.112, "t": 440.3424999999999, "r": 286.36334, "b": 481.23544, "coord_origin": "TOPLEFT" }, "confidence": 0.9274735450744629, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 448.3584599999999, "r_x1": 65.399307, "r_y1": 448.3584599999999, "r_x2": 65.399307, "r_y2": 440.3424999999999, "r_x3": 50.112, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.693321, "r_y0": 448.3584599999999, "r_x1": 286.3587, "r_y1": 448.3584599999999, "r_x2": 286.3587, "r_y2": 440.3424999999999, "r_x3": 67.693321, "r_y3": 440.3424999999999, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 459.31747, "r_x1": 202.74268, "r_y1": 459.31747, "r_x2": 202.74268, "r_y2": 451.30151, "r_x3": 70.030998, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.00122, "r_y0": 459.31747, "r_x1": 286.36331, "r_y1": 459.31747, "r_x2": 286.36331, "r_y2": 451.30151, "r_x3": 209.00122, "r_y3": 451.30151, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 470.27646, "r_x1": 286.36334, "r_y1": 470.27646, "r_x2": 286.36334, "r_y2": 462.2605, "r_x3": 70.030998, "r_y3": 462.2605, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 481.23544, "r_x1": 141.86981, "r_y1": 481.23544, "r_x2": 141.86981, "r_y2": 473.21948, "r_x3": 70.030998, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.097, "r_y0": 481.02924, "r_x1": 166.01561, "r_y1": 481.02924, "r_x2": 166.01561, "r_y2": 473.30017, "r_x3": 145.097, "r_y3": 473.30017, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.015, "r_y0": 481.23544, "r_x1": 259.90216, "r_y1": 481.23544, "r_x2": 259.90216, "r_y2": 473.21948, "r_x3": 166.015, "r_y3": 473.21948, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2" }, { "label": "list_item", "id": 11, "page_no": 8, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.112, "t": 484.49048, "r": 286.36331, "b": 536.34238, "coord_origin": "TOPLEFT" }, "confidence": 0.9299950003623962, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.50644, "r_x1": 66.033806, "r_y1": 492.50644, "r_x2": 66.033806, "r_y2": 484.49048, "r_x3": 50.112, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.423035, "r_y0": 492.50644, "r_x1": 286.35873, "r_y1": 492.50644, "r_x2": 286.35873, "r_y2": 484.49048, "r_x3": 68.423035, "r_y3": 484.49048, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 503.46542, "r_x1": 286.36331, "r_y1": 503.46542, "r_x2": 286.36331, "r_y2": 495.44946, "r_x3": 70.030998, "r_y3": 495.44946, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 514.2182, "r_x1": 227.40926, "r_y1": 514.2182, "r_x2": 227.40926, "r_y2": 506.48914, "r_x3": 70.030998, "r_y3": 506.48914, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.40500000000003, "r_y0": 514.4244100000001, "r_x1": 286.35913, "r_y1": 514.4244100000001, "r_x2": 286.35913, "r_y2": 506.40845, "r_x3": 227.40500000000003, "r_y3": 506.40845, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 525.38339, "r_x1": 286.36328, "r_y1": 525.38339, "r_x2": 286.36328, "r_y2": 517.36743, "r_x3": 70.031006, "r_y3": 517.36743, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 536.34238, "r_x1": 112.36138000000001, "r_y1": 536.34238, "r_x2": 112.36138000000001, "r_y2": 528.32642, "r_x3": 70.031006, "r_y3": 528.32642, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2" }, { "label": "list_item", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.112007, "t": 539.59842, "r": 286.36334, "b": 591.44937, "coord_origin": "TOPLEFT" }, "confidence": 0.9394103288650513, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 547.61438, "r_x1": 65.466705, "r_y1": 547.61438, "r_x2": 65.466705, "r_y2": 539.59842, "r_x3": 50.112007, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.770828, "r_y0": 547.61438, "r_x1": 286.35873, "r_y1": 547.61438, "r_x2": 286.35873, "r_y2": 539.59842, "r_x3": 67.770828, "r_y3": 539.59842, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 558.57338, "r_x1": 136.28374, "r_y1": 558.57338, "r_x2": 136.28374, "r_y2": 550.55742, "r_x3": 70.031006, "r_y3": 550.55742, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.811, "r_y0": 558.36716, "r_x1": 286.36206, "r_y1": 558.36716, "r_x2": 286.36206, "r_y2": 550.63812, "r_x3": 138.811, "r_y3": 550.63812, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 569.32616, "r_x1": 286.36334, "r_y1": 569.32616, "r_x2": 286.36334, "r_y2": 561.5971199999999, "r_x3": 70.031006, "r_y3": 561.5971199999999, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 580.28516, "r_x1": 74.514206, "r_y1": 580.28516, "r_x2": 74.514206, "r_y2": 572.55612, "r_x3": 70.031006, "r_y3": 572.55612, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.514008, "r_y0": 580.4913799999999, "r_x1": 286.36313, "r_y1": 580.4913799999999, "r_x2": 286.36313, "r_y2": 572.47542, "r_x3": 74.514008, "r_y3": 572.47542, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 591.44937, "r_x1": 90.357834, "r_y1": 591.44937, "r_x2": 90.357834, "r_y2": 583.4334100000001, "r_x3": 70.031006, "r_y3": 583.4334100000001, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2" }, { "label": "list_item", "id": 13, "page_no": 8, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.112007, "t": 594.70541, "r": 286.36331, "b": 646.55737, "coord_origin": "TOPLEFT" }, "confidence": 0.9298838973045349, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 602.72137, "r_x1": 66.270439, "r_y1": 602.72137, "r_x2": 66.270439, "r_y2": 594.70541, "r_x3": 50.112007, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.695168, "r_y0": 602.72137, "r_x1": 286.35873, "r_y1": 602.72137, "r_x2": 286.35873, "r_y2": 594.70541, "r_x3": 68.695168, "r_y3": 594.70541, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 613.68037, "r_x1": 286.3631, "r_y1": 613.68037, "r_x2": 286.3631, "r_y2": 605.66441, "r_x3": 70.031006, "r_y3": 605.66441, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 624.63937, "r_x1": 286.36331, "r_y1": 624.63937, "r_x2": 286.36331, "r_y2": 616.62341, "r_x3": 70.031006, "r_y3": 616.62341, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 635.5983699999999, "r_x1": 77.500015, "r_y1": 635.5983699999999, "r_x2": 77.500015, "r_y2": 627.58241, "r_x3": 70.031006, "r_y3": 627.58241, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.920006, "r_y0": 635.39215, "r_x1": 286.3624, "r_y1": 635.39215, "r_x2": 286.3624, "r_y2": 627.6631199999999, "r_x3": 79.920006, "r_y3": 627.6631199999999, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 646.35115, "r_x1": 140.67728, "r_y1": 646.35115, "r_x2": 140.67728, "r_y2": 638.62212, "r_x3": 70.031006, "r_y3": 638.62212, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.67599, "r_y0": 646.55737, "r_x1": 264.43921, "r_y1": 646.55737, "r_x2": 264.43921, "r_y2": 638.54141, "r_x3": 140.67599, "r_y3": 638.54141, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2" }, { "label": "list_item", "id": 17, "page_no": 8, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 50.111992, "t": 649.81342, "r": 286.36334, "b": 679.74638, "coord_origin": "TOPLEFT" }, "confidence": 0.9115257263183594, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 657.82938, "r_x1": 66.534035, "r_y1": 657.82938, "r_x2": 66.534035, "r_y2": 649.81342, "r_x3": 50.111992, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.998329, "r_y0": 657.82938, "r_x1": 286.35873, "r_y1": 657.82938, "r_x2": 286.35873, "r_y2": 649.81342, "r_x3": 68.998329, "r_y3": 649.81342, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 668.78738, "r_x1": 93.200165, "r_y1": 668.78738, "r_x2": 93.200165, "r_y2": 660.77142, "r_x3": 70.030991, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.20243, "r_y0": 668.78738, "r_x1": 286.36334, "r_y1": 668.78738, "r_x2": 286.36334, "r_y2": 660.77142, "r_x3": 102.20243, "r_y3": 660.77142, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 679.74638, "r_x1": 171.9969, "r_y1": 679.74638, "r_x2": 171.9969, "r_y2": 671.73042, "r_x3": 70.030991, "r_y3": 671.73042, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2" }, { "label": "list_item", "id": 16, "page_no": 8, "cluster": { "id": 16, "label": "list_item", "bbox": { "l": 50.111992, "t": 683.00243, "r": 286.35931, "b": 712.936386, "coord_origin": "TOPLEFT" }, "confidence": 0.912230372428894, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111992, "r_y0": 691.01839, "r_x1": 65.515968, "r_y1": 691.01839, "r_x2": 65.515968, "r_y2": 683.00243, "r_x3": 50.111992, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.827499, "r_y0": 691.01839, "r_x1": 286.3587, "r_y1": 691.01839, "r_x2": 286.3587, "r_y2": 683.00243, "r_x3": 67.827499, "r_y3": 683.00243, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030991, "r_y0": 701.977386, "r_x1": 102.15761, "r_y1": 701.977386, "r_x2": 102.15761, "r_y2": 693.9614260000001, "r_x3": 70.030991, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.54999, "r_y0": 701.771156, "r_x1": 231.47461, "r_y1": 701.771156, "r_x2": 231.47461, "r_y2": 694.0421220000001, "r_x3": 107.54999, "r_y3": 694.0421220000001, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.47598, "r_y0": 701.977386, "r_x1": 286.35931, "r_y1": 701.977386, "r_x2": 286.35931, "r_y2": 693.9614260000001, "r_x3": 231.47598, "r_y3": 693.9614260000001, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030975, "r_y0": 712.936386, "r_x1": 97.916481, "r_y1": 712.936386, "r_x2": 97.916481, "r_y2": 704.920425, "r_x3": 70.030975, "r_y3": 704.920425, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6" }, { "label": "list_item", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86197, "t": 75.88342000000011, "r": 545.11475, "b": 138.69335999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9389600157737732, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 83.89940999999999, "r_x1": 324.74973, "r_y1": 83.89940999999999, "r_x2": 324.74973, "r_y2": 75.88342000000011, "r_x3": 308.86197, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13382, "r_y0": 83.89940999999999, "r_x1": 545.1087, "r_y1": 83.89940999999999, "r_x2": 545.1087, "r_y2": 75.88342000000011, "r_x3": 327.13382, "r_y3": 75.88342000000011, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 94.85741999999993, "r_x1": 545.1134, "r_y1": 94.85741999999993, "r_x2": 545.1134, "r_y2": 86.84142999999995, "r_x3": 328.78098, "r_y3": 86.84142999999995, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 105.81641000000002, "r_x1": 390.96295, "r_y1": 105.81641000000002, "r_x2": 390.96295, "r_y2": 97.80042000000003, "r_x3": 328.78098, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27008, "r_y0": 105.81641000000002, "r_x1": 435.1404099999999, "r_y1": 105.81641000000002, "r_x2": 435.1404099999999, "r_y2": 97.80042000000003, "r_x3": 400.27008, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71277, "r_y0": 105.81641000000002, "r_x1": 545.11328, "r_y1": 105.81641000000002, "r_x2": 545.11328, "r_y2": 97.80042000000003, "r_x3": 441.71277, "r_y3": 97.80042000000003, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 116.7753899999999, "r_x1": 440.80719, "r_y1": 116.7753899999999, "r_x2": 440.80719, "r_y2": 108.75940000000003, "r_x3": 328.78098, "r_y3": 108.75940000000003, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63498, "r_y0": 116.56914999999992, "r_x1": 545.11304, "r_y1": 116.56914999999992, "r_x2": 545.11304, "r_y2": 108.84009000000003, "r_x3": 446.63498, "r_y3": 108.84009000000003, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78098, "r_y0": 127.52814000000001, "r_x1": 471.13153, "r_y1": 127.52814000000001, "r_x2": 471.13153, "r_y2": 119.79907000000003, "r_x3": 328.78098, "r_y3": 119.79907000000003, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13300000000004, "r_y0": 127.73437999999999, "r_x1": 545.11475, "r_y1": 127.73437999999999, "r_x2": 545.11475, "r_y2": 119.71838000000002, "r_x3": 471.13300000000004, "r_y3": 119.71838000000002, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 138.69335999999998, "r_x1": 356.6665, "r_y1": 138.69335999999998, "r_x2": 356.6665, "r_y2": 130.67737, "r_x3": 328.78101, "r_y3": 130.67737, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4" }, { "label": "list_item", "id": 15, "page_no": 8, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.862, "t": 142.12334999999996, "r": 545.1134, "b": 172.05633999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9253129959106445, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 150.13933999999995, "r_x1": 325.24371, "r_y1": 150.13933999999995, "r_x2": 325.24371, "r_y2": 142.12334999999996, "r_x3": 308.862, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.70197, "r_y0": 150.13933999999995, "r_x1": 545.10883, "r_y1": 150.13933999999995, "r_x2": 545.10883, "r_y2": 142.12334999999996, "r_x3": 327.70197, "r_y3": 142.12334999999996, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.09735, "r_x1": 414.44598, "r_y1": 161.09735, "r_x2": 414.44598, "r_y2": 153.08136000000002, "r_x3": 328.78101, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.82532, "r_y0": 161.09735, "r_x1": 545.1134, "r_y1": 161.09735, "r_x2": 545.1134, "r_y2": 153.08136000000002, "r_x3": 421.82532, "r_y3": 153.08136000000002, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 172.05633999999998, "r_x1": 493.62835999999993, "r_y1": 172.05633999999998, "r_x2": 493.62835999999993, "r_y2": 164.04034000000001, "r_x3": 328.78101, "r_y3": 164.04034000000001, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3" }, { "label": "list_item", "id": 12, "page_no": 8, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 308.862, "t": 175.48632999999995, "r": 545.11353, "b": 260.21423000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9299732446670532, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.50232000000005, "r_x1": 324.26599, "r_y1": 183.50232000000005, "r_x2": 324.26599, "r_y2": 175.48632999999995, "r_x3": 308.862, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57751, "r_y0": 183.50232000000005, "r_x1": 545.10876, "r_y1": 183.50232000000005, "r_x2": 545.10876, "r_y2": 175.48632999999995, "r_x3": 326.57751, "r_y3": 175.48632999999995, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 194.46130000000005, "r_x1": 545.11334, "r_y1": 194.46130000000005, "r_x2": 545.11334, "r_y2": 186.44530999999995, "r_x3": 328.78101, "r_y3": 186.44530999999995, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 205.42029000000002, "r_x1": 545.11346, "r_y1": 205.42029000000002, "r_x2": 545.11346, "r_y2": 197.40430000000003, "r_x3": 328.78101, "r_y3": 197.40430000000003, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 216.37927000000002, "r_x1": 545.11353, "r_y1": 216.37927000000002, "r_x2": 545.11353, "r_y2": 208.36328000000003, "r_x3": 328.78101, "r_y3": 208.36328000000003, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 227.33826, "r_x1": 479.26413, "r_y1": 227.33826, "r_x2": 479.26413, "r_y2": 219.32227, "r_x3": 328.78101, "r_y3": 219.32227, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.11902, "r_y0": 227.13202, "r_x1": 545.11273, "r_y1": 227.13202, "r_x2": 545.11273, "r_y2": 219.40295000000003, "r_x3": 483.11902, "r_y3": 219.40295000000003, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 238.09002999999996, "r_x1": 519.39771, "r_y1": 238.09002999999996, "r_x2": 519.39771, "r_y2": 230.36095999999998, "r_x3": 328.78101, "r_y3": 230.36095999999998, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.401, "r_y0": 238.29625999999996, "r_x1": 545.10767, "r_y1": 238.29625999999996, "r_x2": 545.10767, "r_y2": 230.28026999999997, "r_x3": 519.401, "r_y3": 230.28026999999997, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 249.25525000000005, "r_x1": 545.11328, "r_y1": 249.25525000000005, "r_x2": 545.11328, "r_y2": 241.23925999999994, "r_x3": 328.78101, "r_y3": 241.23925999999994, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 260.21423000000004, "r_x1": 333.26422, "r_y1": 260.21423000000004, "r_x2": 333.26422, "r_y2": 252.19824000000006, "r_x3": 328.78101, "r_y3": 252.19824000000006, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 308.862, "t": 263.64423, "r": 545.1142, "b": 326.45413, "coord_origin": "TOPLEFT" }, "confidence": 0.937321662902832, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 271.66022, "r_x1": 324.26477, "r_y1": 271.66022, "r_x2": 324.26477, "r_y2": 263.64423, "r_x3": 308.862, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.57611, "r_y0": 271.66022, "r_x1": 545.10883, "r_y1": 271.66022, "r_x2": 545.10883, "r_y2": 263.64423, "r_x3": 326.57611, "r_y3": 263.64423, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 282.61917000000005, "r_x1": 545.1134, "r_y1": 282.61917000000005, "r_x2": 545.1134, "r_y2": 274.60321, "r_x3": 328.78101, "r_y3": 274.60321, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 293.57816, "r_x1": 545.11328, "r_y1": 293.57816, "r_x2": 545.11328, "r_y2": 285.56219, "r_x3": 328.78101, "r_y3": 285.56219, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 304.53714, "r_x1": 545.11334, "r_y1": 304.53714, "r_x2": 545.11334, "r_y2": 296.52118, "r_x3": 328.78101, "r_y3": 296.52118, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 315.49515, "r_x1": 352.84683, "r_y1": 315.49515, "r_x2": 352.84683, "r_y2": 307.47919, "r_x3": 328.78101, "r_y3": 307.47919, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.23599, "r_y0": 315.28894, "r_x1": 545.1142, "r_y1": 315.28894, "r_x2": 545.1142, "r_y2": 307.55988, "r_x3": 360.23599, "r_y3": 307.55988, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 326.24792, "r_x1": 371.02173, "r_y1": 326.24792, "r_x2": 371.02173, "r_y2": 318.51886, "r_x3": 328.78101, "r_y3": 318.51886, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.021, "r_y0": 326.45413, "r_x1": 502.26227, "r_y1": 326.45413, "r_x2": 502.26227, "r_y2": 318.43817, "r_x3": 371.021, "r_y3": 318.43817, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1" }, { "label": "list_item", "id": 18, "page_no": 8, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.862, "t": 329.88419, "r": 545.11609, "b": 370.77713, "coord_origin": "TOPLEFT" }, "confidence": 0.9027292728424072, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 337.90015, "r_x1": 323.82672, "r_y1": 337.90015, "r_x2": 323.82672, "r_y2": 329.88419, "r_x3": 308.862, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07233, "r_y0": 337.90015, "r_x1": 545.10876, "r_y1": 337.90015, "r_x2": 545.10876, "r_y2": 329.88419, "r_x3": 326.07233, "r_y3": 329.88419, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 348.85916, "r_x1": 545.11346, "r_y1": 348.85916, "r_x2": 545.11346, "r_y2": 340.8432, "r_x3": 328.78101, "r_y3": 340.8432, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 359.81815000000006, "r_x1": 382.7767, "r_y1": 359.81815000000006, "r_x2": 382.7767, "r_y2": 351.80219000000005, "r_x3": 328.78101, "r_y3": 351.80219000000005, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54102, "r_y0": 359.61194, "r_x1": 545.11609, "r_y1": 359.61194, "r_x2": 545.11609, "r_y2": 351.88287, "r_x3": 385.54102, "r_y3": 351.88287, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 370.57092, "r_x1": 443.59579, "r_y1": 370.57092, "r_x2": 443.59579, "r_y2": 362.84186, "r_x3": 328.78101, "r_y3": 362.84186, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59399, "r_y0": 370.77713, "r_x1": 534.48645, "r_y1": 370.77713, "r_x2": 534.48645, "r_y2": 362.76117, "r_x3": 443.59399, "r_y3": 362.76117, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2" }, { "label": "list_item", "id": 21, "page_no": 8, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.862, "t": 374.20618, "r": 545.11346, "b": 437.01706, "coord_origin": "TOPLEFT" }, "confidence": 0.882714569568634, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 382.22214, "r_x1": 324.60281, "r_y1": 382.22214, "r_x2": 324.60281, "r_y2": 374.20618, "r_x3": 308.862, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96487, "r_y0": 382.22214, "r_x1": 362.6604, "r_y1": 382.22214, "r_x2": 362.6604, "r_y2": 374.20618, "r_x3": 326.96487, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69479, "r_y0": 382.22214, "r_x1": 389.6134, "r_y1": 382.22214, "r_x2": 389.6134, "r_y2": 374.20618, "r_x3": 368.69479, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.6478, "r_y0": 382.22214, "r_x1": 424.56445, "r_y1": 382.22214, "r_x2": 424.56445, "r_y2": 374.20618, "r_x3": 395.6478, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.5492899999999, "r_y0": 382.22214, "r_x1": 438.0230399999999, "r_y1": 382.22214, "r_x2": 438.0230399999999, "r_y2": 374.20618, "r_x3": 431.5492899999999, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.05743, "r_y0": 382.22214, "r_x1": 488.5038799999999, "r_y1": 382.22214, "r_x2": 488.5038799999999, "r_y2": 374.20618, "r_x3": 444.05743, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.47974, "r_y0": 382.22214, "r_x1": 515.41205, "r_y1": 382.22214, "r_x2": 515.41205, "r_y2": 374.20618, "r_x3": 495.47974, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.44641, "r_y0": 382.22214, "r_x1": 545.10876, "r_y1": 382.22214, "r_x2": 545.10876, "r_y2": 374.20618, "r_x3": 521.44641, "r_y3": 374.20618, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 393.18112, "r_x1": 545.1134, "r_y1": 393.18112, "r_x2": 545.1134, "r_y2": 385.16516, "r_x3": 328.78101, "r_y3": 385.16516, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 404.14011, "r_x1": 545.11346, "r_y1": 404.14011, "r_x2": 545.11346, "r_y2": 396.12415, "r_x3": 328.78101, "r_y3": 396.12415, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 415.09909, "r_x1": 478.00881999999996, "r_y1": 415.09909, "r_x2": 478.00881999999996, "r_y2": 407.08313, "r_x3": 328.78101, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.0701, "r_y0": 415.09909, "r_x1": 491.53912, "r_y1": 415.09909, "r_x2": 491.53912, "r_y2": 407.08313, "r_x3": 484.0701, "r_y3": 407.08313, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.668, "r_y0": 414.89288, "r_x1": 545.11298, "r_y1": 414.89288, "r_x2": 545.11298, "r_y2": 407.16382, "r_x3": 494.668, "r_y3": 407.16382, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 425.85187, "r_x1": 545.11334, "r_y1": 425.85187, "r_x2": 545.11334, "r_y2": 418.12280000000004, "r_x3": 328.78101, "r_y3": 418.12280000000004, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 436.8108500000001, "r_x1": 360.83591, "r_y1": 436.8108500000001, "r_x2": 360.83591, "r_y2": 429.08179, "r_x3": 328.78101, "r_y3": 429.08179, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.836, "r_y0": 437.01706, "r_x1": 475.63287, "r_y1": 437.01706, "r_x2": 475.63287, "r_y2": 429.0011, "r_x3": 360.836, "r_y3": 429.0011, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1" }, { "label": "list_item", "id": 20, "page_no": 8, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 308.862, "t": 440.44611, "r": 545.11475, "b": 558.05096, "coord_origin": "TOPLEFT" }, "confidence": 0.8896440863609314, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.46207, "r_x1": 324.57407, "r_y1": 448.46207, "r_x2": 324.57407, "r_y2": 440.44611, "r_x3": 308.862, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93179, "r_y0": 448.46207, "r_x1": 545.1087, "r_y1": 448.46207, "r_x2": 545.1087, "r_y2": 440.44611, "r_x3": 326.93179, "r_y3": 440.44611, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 459.42105, "r_x1": 545.11346, "r_y1": 459.42105, "r_x2": 545.11346, "r_y2": 451.40509, "r_x3": 328.78101, "r_y3": 451.40509, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 470.38004, "r_x1": 545.11328, "r_y1": 470.38004, "r_x2": 545.11328, "r_y2": 462.36407, "r_x3": 328.78101, "r_y3": 462.36407, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 481.33902, "r_x1": 545.11328, "r_y1": 481.33902, "r_x2": 545.11328, "r_y2": 473.32306, "r_x3": 328.78101, "r_y3": 473.32306, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 492.298, "r_x1": 545.11328, "r_y1": 492.298, "r_x2": 545.11328, "r_y2": 484.28204, "r_x3": 328.78101, "r_y3": 484.28204, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 503.25699, "r_x1": 545.1134, "r_y1": 503.25699, "r_x2": 545.1134, "r_y2": 495.24103, "r_x3": 328.78101, "r_y3": 495.24103, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 514.21597, "r_x1": 545.1134, "r_y1": 514.21597, "r_x2": 545.1134, "r_y2": 506.20001, "r_x3": 328.78101, "r_y3": 506.20001, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 525.17496, "r_x1": 545.1098, "r_y1": 525.17496, "r_x2": 545.1098, "r_y2": 517.159, "r_x3": 328.78101, "r_y3": 517.159, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 536.13297, "r_x1": 434.56659, "r_y1": 536.13297, "r_x2": 434.56659, "r_y2": 528.117, "r_x3": 328.78101, "r_y3": 528.117, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86401, "r_y0": 535.9267600000001, "r_x1": 545.11115, "r_y1": 535.9267600000001, "r_x2": 545.11115, "r_y2": 528.19769, "r_x3": 437.86401, "r_y3": 528.19769, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 546.8857399999999, "r_x1": 425.73471, "r_y1": 546.8857399999999, "r_x2": 425.73471, "r_y2": 539.15671, "r_x3": 328.78101, "r_y3": 539.15671, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.73602, "r_y0": 547.09196, "r_x1": 545.11475, "r_y1": 547.09196, "r_x2": 545.11475, "r_y2": 539.076, "r_x3": 425.73602, "r_y3": 539.076, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 558.05096, "r_x1": 399.74109, "r_y1": 558.05096, "r_x2": 399.74109, "r_y2": 550.035, "r_x3": 328.78101, "r_y3": 550.035, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6" }, { "label": "list_item", "id": 19, "page_no": 8, "cluster": { "id": 19, "label": "list_item", "bbox": { "l": 308.862, "t": 561.481, "r": 545.1134, "b": 624.29097, "coord_origin": "TOPLEFT" }, "confidence": 0.9025435447692871, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 569.49696, "r_x1": 324.50351, "r_y1": 569.49696, "r_x2": 324.50351, "r_y2": 561.481, "r_x3": 308.862, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85068, "r_y0": 569.49696, "r_x1": 545.10876, "r_y1": 569.49696, "r_x2": 545.10876, "r_y2": 561.481, "r_x3": 326.85068, "r_y3": 561.481, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 580.45596, "r_x1": 545.1134, "r_y1": 580.45596, "r_x2": 545.1134, "r_y2": 572.44, "r_x3": 328.78101, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 591.4149600000001, "r_x1": 545.11334, "r_y1": 591.4149600000001, "r_x2": 545.11334, "r_y2": 583.399, "r_x3": 328.78101, "r_y3": 583.399, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 602.37396, "r_x1": 431.61667, "r_y1": 602.37396, "r_x2": 431.61667, "r_y2": 594.358, "r_x3": 328.78101, "r_y3": 594.358, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69101000000006, "r_y0": 602.16774, "r_x1": 545.11224, "r_y1": 602.16774, "r_x2": 545.11224, "r_y2": 594.4387099999999, "r_x3": 434.69101000000006, "r_y3": 594.4387099999999, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 613.12575, "r_x1": 545.1134, "r_y1": 613.12575, "r_x2": 545.1134, "r_y2": 605.39671, "r_x3": 328.78101, "r_y3": 605.39671, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 624.08475, "r_x1": 367.8028, "r_y1": 624.08475, "r_x2": 367.8028, "r_y2": 616.35571, "r_x3": 328.78101, "r_y3": 616.35571, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.802, "r_y0": 624.29097, "r_x1": 458.69446000000005, "r_y1": 624.29097, "r_x2": 458.69446000000005, "r_y2": 616.2750100000001, "r_x3": 367.802, "r_y3": 616.2750100000001, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1" }, { "label": "list_item", "id": 23, "page_no": 8, "cluster": { "id": 23, "label": "list_item", "bbox": { "l": 308.862, "t": 627.72101, "r": 545.11621, "b": 668.61398, "coord_origin": "TOPLEFT" }, "confidence": 0.8777532577514648, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 635.73697, "r_x1": 324.69476, "r_y1": 635.73697, "r_x2": 324.69476, "r_y2": 627.72101, "r_x3": 308.862, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07065, "r_y0": 635.73697, "r_x1": 545.1087, "r_y1": 635.73697, "r_x2": 545.1087, "r_y2": 627.72101, "r_x3": 327.07065, "r_y3": 627.72101, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 646.69597, "r_x1": 545.11328, "r_y1": 646.69597, "r_x2": 545.11328, "r_y2": 638.68001, "r_x3": 328.78101, "r_y3": 638.68001, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 657.65497, "r_x1": 336.25003, "r_y1": 657.65497, "r_x2": 336.25003, "r_y2": 649.63901, "r_x3": 328.78101, "r_y3": 649.63901, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.10001, "r_y0": 657.44875, "r_x1": 545.11621, "r_y1": 657.44875, "r_x2": 545.11621, "r_y2": 649.71971, "r_x3": 338.10001, "r_y3": 649.71971, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 668.40775, "r_x1": 406.32245, "r_y1": 668.40775, "r_x2": 406.32245, "r_y2": 660.67871, "r_x3": 328.78101, "r_y3": 660.67871, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 668.61398, "r_x1": 521.1189, "r_y1": 668.61398, "r_x2": 521.1189, "r_y2": 660.5980099999999, "r_x3": 406.32202, "r_y3": 660.5980099999999, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3" }, { "label": "list_item", "id": 24, "page_no": 8, "cluster": { "id": 24, "label": "list_item", "bbox": { "l": 308.86203, "t": 672.04301, "r": 545.1134, "b": 712.935974, "coord_origin": "TOPLEFT" }, "confidence": 0.8654531240463257, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 680.05898, "r_x1": 324.71329, "r_y1": 680.05898, "r_x2": 324.71329, "r_y2": 672.04301, "r_x3": 308.86203, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09195, "r_y0": 680.05898, "r_x1": 545.10876, "r_y1": 680.05898, "r_x2": 545.10876, "r_y2": 672.04301, "r_x3": 327.09195, "r_y3": 672.04301, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 691.01797, "r_x1": 482.81488, "r_y1": 691.01797, "r_x2": 482.81488, "r_y2": 683.0020099999999, "r_x3": 328.78104, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75064, "r_y0": 691.01797, "r_x1": 545.1134, "r_y1": 691.01797, "r_x2": 545.1134, "r_y2": 683.0020099999999, "r_x3": 488.75064, "r_y3": 683.0020099999999, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 701.976974, "r_x1": 545.11334, "r_y1": 701.976974, "r_x2": 545.11334, "r_y2": 693.961014, "r_x3": 328.78104, "r_y3": 693.961014, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78104, "r_y0": 712.935974, "r_x1": 379.1543, "r_y1": 712.935974, "r_x2": 379.1543, "r_y2": 704.920013, "r_x3": 328.78104, "r_y3": 704.920013, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.61603, "r_y0": 712.729744, "r_x1": 545.10938, "r_y1": 712.729744, "r_x2": 545.10938, "r_y2": 705.00071, "r_x3": 381.61603, "r_y3": 705.00071, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on" } ], "headers": [ { "label": "page_footer", "id": 22, "page_no": 8, "cluster": { "id": 22, "label": "page_footer", "bbox": { "l": 295.12103, "t": 734.1325870000001, "r": 300.10233, "b": 743.0391500000001, "coord_origin": "TOPLEFT" }, "confidence": 0.8797808885574341, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12103, "r_y0": 743.0391500000001, "r_x1": 300.10233, "r_y1": 743.0391500000001, "r_x2": 300.10233, "r_y2": 734.1325870000001, "r_x3": 295.12103, "r_y3": 734.1325870000001, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" } ] } }, { "page_no": 9, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.69353999999998, "r_x1": 223.58061, "r_y1": 83.69353999999998, "r_x2": 223.58061, "r_y2": 75.96447999999998, "r_x3": 70.030998, "r_y3": 75.96447999999998, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.57901, "r_y0": 83.89977999999996, "r_x1": 286.36176, "r_y1": 83.89977999999996, "r_x2": 286.36176, "r_y2": 75.88378999999998, "r_x3": 223.57901, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 94.85875999999996, "r_x1": 97.916512, "r_y1": 94.85875999999996, "r_x2": 97.916512, "r_y2": 86.84276999999997, "r_x3": 70.031006, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 106.18176000000005, "r_x1": 65.534088, "r_y1": 106.18176000000005, "r_x2": 65.534088, "r_y2": 98.16576999999995, "r_x3": 50.112007, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 106.18176000000005, "r_x1": 286.35867, "r_y1": 106.18176000000005, "r_x2": 286.35867, "r_y2": 98.16576999999995, "r_x3": 67.84832, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 117.14075000000003, "r_x1": 286.36331, "r_y1": 117.14075000000003, "r_x2": 286.36331, "r_y2": 109.12476000000004, "r_x3": 70.031006, "r_y3": 109.12476000000004, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 128.0997299999999, "r_x1": 286.36334, "r_y1": 128.0997299999999, "r_x2": 286.36334, "r_y2": 120.08374000000003, "r_x3": 70.031006, "r_y3": 120.08374000000003, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.05872, "r_x1": 77.500015, "r_y1": 139.05872, "r_x2": 77.500015, "r_y2": 131.04272000000003, "r_x3": 70.031006, "r_y3": 131.04272000000003, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.560005, "r_y0": 138.85248, "r_x1": 286.36578, "r_y1": 138.85248, "r_x2": 286.36578, "r_y2": 131.12341000000004, "r_x3": 80.560005, "r_y3": 131.12341000000004, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.81146, "r_x1": 195.22885, "r_y1": 149.81146, "r_x2": 195.22885, "r_y2": 142.0824, "r_x3": 70.031006, "r_y3": 142.0824, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.231, "r_y0": 150.0177, "r_x1": 286.36548, "r_y1": 150.0177, "r_x2": 286.36548, "r_y2": 142.00171, "r_x3": 195.231, "r_y3": 142.00171, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 160.97668, "r_x1": 120.33251, "r_y1": 160.97668, "r_x2": 120.33251, "r_y2": 152.96069, "r_x3": 70.031006, "r_y3": 152.96069, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 172.30066, "r_x1": 65.534088, "r_y1": 172.30066, "r_x2": 65.534088, "r_y2": 164.28467, "r_x3": 50.112007, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 172.30066, "r_x1": 286.35867, "r_y1": 172.30066, "r_x2": 286.35867, "r_y2": 164.28467, "r_x3": 67.84832, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 183.25964, "r_x1": 286.36337, "r_y1": 183.25964, "r_x2": 286.36337, "r_y2": 175.24365, "r_x3": 70.031006, "r_y3": 175.24365, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 194.21862999999996, "r_x1": 286.36334, "r_y1": 194.21862999999996, "r_x2": 286.36334, "r_y2": 186.20263999999997, "r_x3": 70.031006, "r_y3": 186.20263999999997, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 205.17760999999996, "r_x1": 101.33271, "r_y1": 205.17760999999996, "r_x2": 101.33271, "r_y2": 197.16161999999997, "r_x3": 70.031006, "r_y3": 197.16161999999997, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33101, "r_y0": 204.97136999999998, "r_x1": 286.35791, "r_y1": 204.97136999999998, "r_x2": 286.35791, "r_y2": 197.24230999999997, "r_x3": 104.33101, "r_y3": 197.24230999999997, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 215.92938000000004, "r_x1": 220.48719999999997, "r_y1": 215.92938000000004, "r_x2": 220.48719999999997, "r_y2": 208.20032000000003, "r_x3": 70.031006, "r_y3": 208.20032000000003, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48401000000004, "r_y0": 216.13562000000002, "r_x1": 286.36017, "r_y1": 216.13562000000002, "r_x2": 286.36017, "r_y2": 208.11963000000003, "r_x3": 220.48401000000004, "r_y3": 208.11963000000003, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 227.0946, "r_x1": 166.65294, "r_y1": 227.0946, "r_x2": 166.65294, "r_y2": 219.07861000000003, "r_x3": 70.031006, "r_y3": 219.07861000000003, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 238.41858000000002, "r_x1": 65.650383, "r_y1": 238.41858000000002, "r_x2": 65.650383, "r_y2": 230.40259000000003, "r_x3": 50.112007, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.982063, "r_y0": 238.41858000000002, "r_x1": 286.3587, "r_y1": 238.41858000000002, "r_x2": 286.3587, "r_y2": 230.40259000000003, "r_x3": 67.982063, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 249.37756000000002, "r_x1": 147.16895, "r_y1": 249.37756000000002, "r_x2": 147.16895, "r_y2": 241.36157000000003, "r_x3": 70.031006, "r_y3": 241.36157000000003, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93301, "r_y0": 249.17133, "r_x1": 286.36578, "r_y1": 249.17133, "r_x2": 286.36578, "r_y2": 241.44226000000003, "r_x3": 149.93301, "r_y3": 241.44226000000003, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 260.13031, "r_x1": 244.6875, "r_y1": 260.13031, "r_x2": 244.6875, "r_y2": 252.40125, "r_x3": 70.031013, "r_y3": 252.40125, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69101, "r_y0": 260.33655, "r_x1": 286.35791, "r_y1": 260.33655, "r_x2": 286.35791, "r_y2": 252.32056, "r_x3": 244.69101, "r_y3": 252.32056, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 271.29553, "r_x1": 111.36611, "r_y1": 271.29553, "r_x2": 111.36611, "r_y2": 263.27954, "r_x3": 70.031006, "r_y3": 263.27954, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 282.61951, "r_x1": 66.023834, "r_y1": 282.61951, "r_x2": 66.023834, "r_y2": 274.60357999999997, "r_x3": 50.112007, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.411568, "r_y0": 282.61951, "r_x1": 94.944016, "r_y1": 282.61951, "r_x2": 94.944016, "r_y2": 274.60357999999997, "r_x3": 68.411568, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.8708, "r_y0": 282.61951, "r_x1": 127.26788000000002, "r_y1": 282.61951, "r_x2": 127.26788000000002, "r_y2": 274.60357999999997, "r_x3": 100.8708, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19467, "r_y0": 282.61951, "r_x1": 165.83237, "r_y1": 282.61951, "r_x2": 165.83237, "r_y2": 274.60357999999997, "r_x3": 133.19467, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68269, "r_y0": 282.61951, "r_x1": 194.09445, "r_y1": 282.61951, "r_x2": 194.09445, "r_y2": 274.60357999999997, "r_x3": 172.68269, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02124, "r_y0": 282.61951, "r_x1": 211.4803, "r_y1": 282.61951, "r_x2": 211.4803, "r_y2": 274.60357999999997, "r_x3": 200.02124, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.40708999999998, "r_y0": 282.61951, "r_x1": 239.43755, "r_y1": 282.61951, "r_x2": 239.43755, "r_y2": 274.60357999999997, "r_x3": 217.40708999999998, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.28787000000003, "r_y0": 282.61951, "r_x1": 264.22067, "r_y1": 282.61951, "r_x2": 264.22067, "r_y2": 274.60357999999997, "r_x3": 246.28787000000003, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.14746, "r_y0": 282.61951, "r_x1": 286.35873, "r_y1": 282.61951, "r_x2": 286.35873, "r_y2": 274.60357999999997, "r_x3": 270.14746, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 293.57852, "r_x1": 286.36331, "r_y1": 293.57852, "r_x2": 286.36331, "r_y2": 285.56256, "r_x3": 70.031006, "r_y3": 285.56256, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 304.53751, "r_x1": 286.36331, "r_y1": 304.53751, "r_x2": 286.36331, "r_y2": 296.52155, "r_x3": 70.031006, "r_y3": 296.52155, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 315.49649, "r_x1": 77.500015, "r_y1": 315.49649, "r_x2": 77.500015, "r_y2": 307.48053, "r_x3": 70.031006, "r_y3": 307.48053, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.350006, "r_y0": 315.29028, "r_x1": 286.36627, "r_y1": 315.29028, "r_x2": 286.36627, "r_y2": 307.56122, "r_x3": 79.350006, "r_y3": 307.56122, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 326.24829, "r_x1": 147.57243, "r_y1": 326.24829, "r_x2": 147.57243, "r_y2": 318.51923, "r_x3": 70.031006, "r_y3": 318.51923, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57201, "r_y0": 326.4545, "r_x1": 271.33521, "r_y1": 326.4545, "r_x2": 271.33521, "r_y2": 318.43854, "r_x3": 147.57201, "r_y3": 318.43854, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 337.7785, "r_x1": 65.366135, "r_y1": 337.7785, "r_x2": 65.366135, "r_y2": 329.76254, "r_x3": 50.112007, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.655159, "r_y0": 337.7785, "r_x1": 286.3587, "r_y1": 337.7785, "r_x2": 286.3587, "r_y2": 329.76254, "r_x3": 67.655159, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 348.7375200000001, "r_x1": 286.36334, "r_y1": 348.7375200000001, "r_x2": 286.36334, "r_y2": 340.72156000000007, "r_x3": 70.031006, "r_y3": 340.72156000000007, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 359.6965, "r_x1": 198.82439, "r_y1": 359.6965, "r_x2": 198.82439, "r_y2": 351.68054, "r_x3": 70.031006, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06027, "r_y0": 359.6965, "r_x1": 213.52928, "r_y1": 359.6965, "r_x2": 213.52928, "r_y2": 351.68054, "r_x3": 206.06027, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02101, "r_y0": 359.4903, "r_x1": 286.35815, "r_y1": 359.4903, "r_x2": 286.35815, "r_y2": 351.76123, "r_x3": 217.02101, "r_y3": 351.76123, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 370.44928, "r_x1": 143.08028, "r_y1": 370.44928, "r_x2": 143.08028, "r_y2": 362.72021, "r_x3": 70.031006, "r_y3": 362.72021, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.078, "r_y0": 370.65549000000004, "r_x1": 286.36111, "r_y1": 370.65549000000004, "r_x2": 286.36111, "r_y2": 362.63953000000004, "r_x3": 143.078, "r_y3": 362.63953000000004, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 381.61447, "r_x1": 161.15652, "r_y1": 381.61447, "r_x2": 161.15652, "r_y2": 373.59851, "r_x3": 70.031006, "r_y3": 373.59851, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 392.93848, "r_x1": 65.140724, "r_y1": 392.93848, "r_x2": 65.140724, "r_y2": 384.92252, "r_x3": 50.112007, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.395927, "r_y0": 392.93848, "r_x1": 286.35876, "r_y1": 392.93848, "r_x2": 286.35876, "r_y2": 384.92252, "r_x3": 67.395927, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 403.89749, "r_x1": 286.36337, "r_y1": 403.89749, "r_x2": 286.36337, "r_y2": 395.88153, "r_x3": 70.031006, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 414.85648, "r_x1": 125.47024999999998, "r_y1": 414.85648, "r_x2": 125.47024999999998, "r_y2": 406.84052, "r_x3": 70.031006, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.90764, "r_y0": 414.85648, "r_x1": 230.83444, "r_y1": 414.85648, "r_x2": 230.83444, "r_y2": 406.84052, "r_x3": 133.90764, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27182, "r_y0": 414.85648, "r_x1": 286.36334, "r_y1": 414.85648, "r_x2": 286.36334, "r_y2": 406.84052, "r_x3": 239.27182, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 425.81546, "r_x1": 78.958366, "r_y1": 425.81546, "r_x2": 78.958366, "r_y2": 417.7995, "r_x3": 70.031006, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.254494, "r_y0": 425.81546, "r_x1": 286.36334, "r_y1": 425.81546, "r_x2": 286.36334, "r_y2": 417.7995, "r_x3": 81.254494, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.7734699999999, "r_x1": 196.7621, "r_y1": 436.7734699999999, "r_x2": 196.7621, "r_y2": 428.75751, "r_x3": 70.031006, "r_y3": 428.75751, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.20201, "r_y0": 436.56726, "r_x1": 286.36017, "r_y1": 436.56726, "r_x2": 286.36017, "r_y2": 428.8381999999999, "r_x3": 200.20201, "r_y3": 428.8381999999999, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 447.52624999999995, "r_x1": 189.19447, "r_y1": 447.52624999999995, "r_x2": 189.19447, "r_y2": 439.79717999999997, "r_x3": 70.031006, "r_y3": 439.79717999999997, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.19501, "r_y0": 447.73245, "r_x1": 286.36389, "r_y1": 447.73245, "r_x2": 286.36389, "r_y2": 439.71648999999996, "r_x3": 189.19501, "r_y3": 439.71648999999996, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 458.69144, "r_x1": 158.9239, "r_y1": 458.69144, "r_x2": 158.9239, "r_y2": 450.67548, "r_x3": 70.031006, "r_y3": 450.67548, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 470.01544, "r_x1": 65.910469, "r_y1": 470.01544, "r_x2": 65.910469, "r_y2": 461.99948, "r_x3": 50.112007, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.281181, "r_y0": 470.01544, "r_x1": 286.35873, "r_y1": 470.01544, "r_x2": 286.35873, "r_y2": 461.99948, "r_x3": 68.281181, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 480.97446, "r_x1": 116.27969999999999, "r_y1": 480.97446, "r_x2": 116.27969999999999, "r_y2": 472.9585, "r_x3": 70.031006, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48445, "r_y0": 480.97446, "r_x1": 286.36334, "r_y1": 480.97446, "r_x2": 286.36334, "r_y2": 472.9585, "r_x3": 122.48445, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 491.93344, "r_x1": 103.30532, "r_y1": 491.93344, "r_x2": 103.30532, "r_y2": 483.91748, "r_x3": 70.031006, "r_y3": 483.91748, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.51601, "r_y0": 491.72723, "r_x1": 286.35931, "r_y1": 491.72723, "r_x2": 286.35931, "r_y2": 483.99817, "r_x3": 105.51601, "r_y3": 483.99817, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 502.68622, "r_x1": 212.51607, "r_y1": 502.68622, "r_x2": 212.51607, "r_y2": 494.95715, "r_x3": 70.031006, "r_y3": 494.95715, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51401, "r_y0": 502.89243, "r_x1": 263.55975, "r_y1": 502.89243, "r_x2": 263.55975, "r_y2": 494.87646, "r_x3": 212.51401, "r_y3": 494.87646, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 514.21643, "r_x1": 65.682777, "r_y1": 514.21643, "r_x2": 65.682777, "r_y2": 506.20047, "r_x3": 50.112015, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.019325, "r_y0": 514.21643, "r_x1": 247.37280000000004, "r_y1": 514.21643, "r_x2": 247.37280000000004, "r_y2": 506.20047, "r_x3": 68.019325, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97208000000003, "r_y0": 514.21643, "r_x1": 286.3587, "r_y1": 514.21643, "r_x2": 286.3587, "r_y2": 506.20047, "r_x3": 253.97208000000003, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 525.17545, "r_x1": 265.62408, "r_y1": 525.17545, "r_x2": 265.62408, "r_y2": 517.15948, "r_x3": 70.031013, "r_y3": 517.15948, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.42902, "r_y0": 524.96924, "r_x1": 286.36182, "r_y1": 524.96924, "r_x2": 286.36182, "r_y2": 517.24017, "r_x3": 268.42902, "r_y3": 517.24017, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 535.92822, "r_x1": 286.36337, "r_y1": 535.92822, "r_x2": 286.36337, "r_y2": 528.19916, "r_x3": 70.031021, "r_y3": 528.19916, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 546.88622, "r_x1": 125.25507999999999, "r_y1": 546.88622, "r_x2": 125.25507999999999, "r_y2": 539.15718, "r_x3": 70.031021, "r_y3": 539.15718, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25402, "r_y0": 547.09244, "r_x1": 240.05083, "r_y1": 547.09244, "r_x2": 240.05083, "r_y2": 539.07648, "r_x3": 125.25402, "r_y3": 539.07648, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 558.41644, "r_x1": 66.037048, "r_y1": 558.41644, "r_x2": 66.037048, "r_y2": 550.40048, "r_x3": 50.112022, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.426765, "r_y0": 558.41644, "r_x1": 286.3587, "r_y1": 558.41644, "r_x2": 286.3587, "r_y2": 550.40048, "r_x3": 68.426765, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 569.37544, "r_x1": 137.08176, "r_y1": 569.37544, "r_x2": 137.08176, "r_y2": 561.35948, "r_x3": 70.031021, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.9854, "r_y0": 569.37544, "r_x1": 172.38248, "r_y1": 569.37544, "r_x2": 172.38248, "r_y2": 561.35948, "r_x3": 145.9854, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7038, "r_y0": 569.37544, "r_x1": 286.36337, "r_y1": 569.37544, "r_x2": 286.36337, "r_y2": 561.35948, "r_x3": 178.7038, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 580.33444, "r_x1": 221.00723, "r_y1": 580.33444, "r_x2": 221.00723, "r_y2": 572.31848, "r_x3": 70.031021, "r_y3": 572.31848, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54300999999998, "r_y0": 580.12822, "r_x1": 286.35938, "r_y1": 580.12822, "r_x2": 286.35938, "r_y2": 572.39919, "r_x3": 232.54300999999998, "r_y3": 572.39919, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 591.08722, "r_x1": 135.53058, "r_y1": 591.08722, "r_x2": 135.53058, "r_y2": 583.35818, "r_x3": 70.031021, "r_y3": 583.35818, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53003, "r_y0": 591.29344, "r_x1": 167.89876, "r_y1": 591.29344, "r_x2": 167.89876, "r_y2": 583.27748, "r_x3": 135.53003, "r_y3": 583.27748, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 602.61745, "r_x1": 65.23661, "r_y1": 602.61745, "r_x2": 65.23661, "r_y2": 594.60149, "r_x3": 50.11203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.506203, "r_y0": 602.61745, "r_x1": 286.3587, "r_y1": 602.61745, "r_x2": 286.3587, "r_y2": 594.60149, "r_x3": 67.506203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 613.57645, "r_x1": 109.1066, "r_y1": 613.57645, "r_x2": 109.1066, "r_y2": 605.56049, "r_x3": 70.031029, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.22592, "r_y0": 613.57645, "r_x1": 271.76605, "r_y1": 613.57645, "r_x2": 271.76605, "r_y2": 605.56049, "r_x3": 116.22592, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89435, "r_y0": 613.57645, "r_x1": 286.36337, "r_y1": 613.57645, "r_x2": 286.36337, "r_y2": 605.56049, "r_x3": 278.89435, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 624.32922, "r_x1": 286.3634, "r_y1": 624.32922, "r_x2": 286.3634, "r_y2": 616.60019, "r_x3": 70.031029, "r_y3": 616.60019, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 635.28822, "r_x1": 139.09921, "r_y1": 635.28822, "r_x2": 139.09921, "r_y2": 627.55919, "r_x3": 70.031029, "r_y3": 627.55919, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.09802, "r_y0": 635.49445, "r_x1": 238.95683, "r_y1": 635.49445, "r_x2": 238.95683, "r_y2": 627.47849, "r_x3": 139.09802, "r_y3": 627.47849, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 646.81845, "r_x1": 65.203552, "r_y1": 646.81845, "r_x2": 65.203552, "r_y2": 638.80249, "r_x3": 50.112022, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.468193, "r_y0": 646.81845, "r_x1": 286.35873, "r_y1": 646.81845, "r_x2": 286.35873, "r_y2": 638.80249, "r_x3": 67.468193, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 657.77646, "r_x1": 286.36337, "r_y1": 657.77646, "r_x2": 286.36337, "r_y2": 649.7605, "r_x3": 70.031021, "r_y3": 649.7605, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 668.73547, "r_x1": 286.36334, "r_y1": 668.73547, "r_x2": 286.36334, "r_y2": 660.7195, "r_x3": 70.031021, "r_y3": 660.7195, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 679.69447, "r_x1": 158.45766, "r_y1": 679.69447, "r_x2": 158.45766, "r_y2": 671.6785, "r_x3": 70.031021, "r_y3": 671.6785, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.52802, "r_y0": 679.48824, "r_x1": 286.36249, "r_y1": 679.48824, "r_x2": 286.36249, "r_y2": 671.7592, "r_x3": 160.52802, "r_y3": 671.7592, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 690.44724, "r_x1": 171.42305, "r_y1": 690.44724, "r_x2": 171.42305, "r_y2": 682.7182, "r_x3": 70.031013, "r_y3": 682.7182, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42201, "r_y0": 690.65347, "r_x1": 212.75713, "r_y1": 690.65347, "r_x2": 212.75713, "r_y2": 682.6375, "r_x3": 171.42201, "r_y3": 682.6375, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.977463, "r_x1": 66.506706, "r_y1": 701.977463, "r_x2": 66.506706, "r_y2": 693.961502, "r_x3": 50.112015, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.966896, "r_y0": 701.977463, "r_x1": 80.992294, "r_y1": 701.977463, "r_x2": 80.992294, "r_y2": 693.961502, "r_x3": 68.966896, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.062057, "r_y0": 701.977463, "r_x1": 114.71492999999998, "r_y1": 701.977463, "r_x2": 114.71492999999998, "r_y2": 693.961502, "r_x3": 89.062057, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.24621000000002, "r_y0": 701.977463, "r_x1": 149.1459, "r_y1": 701.977463, "r_x2": 149.1459, "r_y2": 693.961502, "r_x3": 124.24621000000002, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22462, "r_y0": 701.977463, "r_x1": 209.37321, "r_y1": 701.977463, "r_x2": 209.37321, "r_y2": 693.961502, "r_x3": 157.22462, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9045, "r_y0": 701.977463, "r_x1": 231.85196999999997, "r_y1": 701.977463, "r_x2": 231.85196999999997, "r_y2": 693.961502, "r_x3": 218.9045, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93069, "r_y0": 701.977463, "r_x1": 269.32254, "r_y1": 701.977463, "r_x2": 269.32254, "r_y2": 693.961502, "r_x3": 239.93069, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.3923, "r_y0": 701.977463, "r_x1": 286.3587, "r_y1": 701.977463, "r_x2": 286.3587, "r_y2": 693.961502, "r_x3": 277.3923, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 712.936462, "r_x1": 286.36334, "r_y1": 712.936462, "r_x2": 286.36334, "r_y2": 704.920502, "r_x3": 70.031013, "r_y3": 704.920502, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 83.89948000000015, "r_x1": 545.11346, "r_y1": 83.89948000000015, "r_x2": 545.11346, "r_y2": 75.88347999999996, "r_x3": 328.78101, "r_y3": 75.88347999999996, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 94.85748000000001, "r_x1": 472.30618, "r_y1": 94.85748000000001, "r_x2": 472.30618, "r_y2": 86.84149000000002, "r_x3": 328.78101, "r_y3": 86.84149000000002, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.88501, "r_y0": 94.65125, "r_x1": 545.11456, "r_y1": 94.65125, "r_x2": 545.11456, "r_y2": 86.92218000000003, "r_x3": 475.88501, "r_y3": 86.92218000000003, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 105.61023, "r_x1": 371.92734, "r_y1": 105.61023, "r_x2": 371.92734, "r_y2": 97.88116000000002, "r_x3": 328.78101, "r_y3": 97.88116000000002, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.92599, "r_y0": 105.81646999999987, "r_x1": 545.11206, "r_y1": 105.81646999999987, "r_x2": 545.11206, "r_y2": 97.80048, "r_x3": 371.92599, "r_y3": 97.80048, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 116.77544999999998, "r_x1": 417.70087, "r_y1": 116.77544999999998, "r_x2": 417.70087, "r_y2": 108.75945999999999, "r_x3": 328.78101, "r_y3": 108.75945999999999, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 128.73046999999997, "r_x1": 324.33197, "r_y1": 128.73046999999997, "r_x2": 324.33197, "r_y2": 120.71447999999998, "r_x3": 308.862, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65341, "r_y0": 128.73046999999997, "r_x1": 545.10876, "r_y1": 128.73046999999997, "r_x2": 545.10876, "r_y2": 120.71447999999998, "r_x3": 326.65341, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 139.68944999999997, "r_x1": 545.11334, "r_y1": 139.68944999999997, "r_x2": 545.11334, "r_y2": 131.67345999999998, "r_x3": 328.78101, "r_y3": 131.67345999999998, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 150.44219999999996, "r_x1": 545.11328, "r_y1": 150.44219999999996, "r_x2": 545.11328, "r_y2": 142.71312999999998, "r_x3": 328.78101, "r_y3": 142.71312999999998, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.40117999999995, "r_x1": 406.32245, "r_y1": 161.40117999999995, "r_x2": 406.32245, "r_y2": 153.67211999999995, "r_x3": 328.78101, "r_y3": 153.67211999999995, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 161.60742000000005, "r_x1": 506.18085, "r_y1": 161.60742000000005, "r_x2": 506.18085, "r_y2": 153.59142999999995, "r_x3": 406.32202, "r_y3": 153.59142999999995, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.039555, "r_x1": 302.59259, "r_y1": 743.039555, "r_x2": 302.59259, "r_y2": 734.1329920000001, "r_x3": 292.63, "r_y3": 734.1329920000001, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 15, "label": "text", "bbox": { "l": 70.030998, "t": 75.88378999999998, "r": 286.36176, "b": 94.85875999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.6886764168739319, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.69353999999998, "r_x1": 223.58061, "r_y1": 83.69353999999998, "r_x2": 223.58061, "r_y2": 75.96447999999998, "r_x3": 70.030998, "r_y3": 75.96447999999998, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.57901, "r_y0": 83.89977999999996, "r_x1": 286.36176, "r_y1": 83.89977999999996, "r_x2": 286.36176, "r_y2": 75.88378999999998, "r_x3": 223.57901, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 94.85875999999996, "r_x1": 97.916512, "r_y1": 94.85875999999996, "r_x2": 97.916512, "r_y2": 86.84276999999997, "r_x3": 70.031006, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 50.112007, "t": 98.16576999999995, "r": 286.36578, "b": 160.97668, "coord_origin": "TOPLEFT" }, "confidence": 0.7723011374473572, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 106.18176000000005, "r_x1": 65.534088, "r_y1": 106.18176000000005, "r_x2": 65.534088, "r_y2": 98.16576999999995, "r_x3": 50.112007, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 106.18176000000005, "r_x1": 286.35867, "r_y1": 106.18176000000005, "r_x2": 286.35867, "r_y2": 98.16576999999995, "r_x3": 67.84832, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 117.14075000000003, "r_x1": 286.36331, "r_y1": 117.14075000000003, "r_x2": 286.36331, "r_y2": 109.12476000000004, "r_x3": 70.031006, "r_y3": 109.12476000000004, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 128.0997299999999, "r_x1": 286.36334, "r_y1": 128.0997299999999, "r_x2": 286.36334, "r_y2": 120.08374000000003, "r_x3": 70.031006, "r_y3": 120.08374000000003, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.05872, "r_x1": 77.500015, "r_y1": 139.05872, "r_x2": 77.500015, "r_y2": 131.04272000000003, "r_x3": 70.031006, "r_y3": 131.04272000000003, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.560005, "r_y0": 138.85248, "r_x1": 286.36578, "r_y1": 138.85248, "r_x2": 286.36578, "r_y2": 131.12341000000004, "r_x3": 80.560005, "r_y3": 131.12341000000004, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.81146, "r_x1": 195.22885, "r_y1": 149.81146, "r_x2": 195.22885, "r_y2": 142.0824, "r_x3": 70.031006, "r_y3": 142.0824, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.231, "r_y0": 150.0177, "r_x1": 286.36548, "r_y1": 150.0177, "r_x2": 286.36548, "r_y2": 142.00171, "r_x3": 195.231, "r_y3": 142.00171, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 160.97668, "r_x1": 120.33251, "r_y1": 160.97668, "r_x2": 120.33251, "r_y2": 152.96069, "r_x3": 70.031006, "r_y3": 152.96069, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 50.112007, "t": 164.28467, "r": 286.36337, "b": 227.0946, "coord_origin": "TOPLEFT" }, "confidence": 0.8580600619316101, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 172.30066, "r_x1": 65.534088, "r_y1": 172.30066, "r_x2": 65.534088, "r_y2": 164.28467, "r_x3": 50.112007, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 172.30066, "r_x1": 286.35867, "r_y1": 172.30066, "r_x2": 286.35867, "r_y2": 164.28467, "r_x3": 67.84832, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 183.25964, "r_x1": 286.36337, "r_y1": 183.25964, "r_x2": 286.36337, "r_y2": 175.24365, "r_x3": 70.031006, "r_y3": 175.24365, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 194.21862999999996, "r_x1": 286.36334, "r_y1": 194.21862999999996, "r_x2": 286.36334, "r_y2": 186.20263999999997, "r_x3": 70.031006, "r_y3": 186.20263999999997, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 205.17760999999996, "r_x1": 101.33271, "r_y1": 205.17760999999996, "r_x2": 101.33271, "r_y2": 197.16161999999997, "r_x3": 70.031006, "r_y3": 197.16161999999997, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33101, "r_y0": 204.97136999999998, "r_x1": 286.35791, "r_y1": 204.97136999999998, "r_x2": 286.35791, "r_y2": 197.24230999999997, "r_x3": 104.33101, "r_y3": 197.24230999999997, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 215.92938000000004, "r_x1": 220.48719999999997, "r_y1": 215.92938000000004, "r_x2": 220.48719999999997, "r_y2": 208.20032000000003, "r_x3": 70.031006, "r_y3": 208.20032000000003, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48401000000004, "r_y0": 216.13562000000002, "r_x1": 286.36017, "r_y1": 216.13562000000002, "r_x2": 286.36017, "r_y2": 208.11963000000003, "r_x3": 220.48401000000004, "r_y3": 208.11963000000003, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 227.0946, "r_x1": 166.65294, "r_y1": 227.0946, "r_x2": 166.65294, "r_y2": 219.07861000000003, "r_x3": 70.031006, "r_y3": 219.07861000000003, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 50.112007, "t": 230.40259000000003, "r": 286.36578, "b": 271.29553, "coord_origin": "TOPLEFT" }, "confidence": 0.8512731194496155, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 238.41858000000002, "r_x1": 65.650383, "r_y1": 238.41858000000002, "r_x2": 65.650383, "r_y2": 230.40259000000003, "r_x3": 50.112007, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.982063, "r_y0": 238.41858000000002, "r_x1": 286.3587, "r_y1": 238.41858000000002, "r_x2": 286.3587, "r_y2": 230.40259000000003, "r_x3": 67.982063, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 249.37756000000002, "r_x1": 147.16895, "r_y1": 249.37756000000002, "r_x2": 147.16895, "r_y2": 241.36157000000003, "r_x3": 70.031006, "r_y3": 241.36157000000003, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93301, "r_y0": 249.17133, "r_x1": 286.36578, "r_y1": 249.17133, "r_x2": 286.36578, "r_y2": 241.44226000000003, "r_x3": 149.93301, "r_y3": 241.44226000000003, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 260.13031, "r_x1": 244.6875, "r_y1": 260.13031, "r_x2": 244.6875, "r_y2": 252.40125, "r_x3": 70.031013, "r_y3": 252.40125, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69101, "r_y0": 260.33655, "r_x1": 286.35791, "r_y1": 260.33655, "r_x2": 286.35791, "r_y2": 252.32056, "r_x3": 244.69101, "r_y3": 252.32056, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 271.29553, "r_x1": 111.36611, "r_y1": 271.29553, "r_x2": 111.36611, "r_y2": 263.27954, "r_x3": 70.031006, "r_y3": 263.27954, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 50.112007, "t": 274.60357999999997, "r": 286.36627, "b": 326.4545, "coord_origin": "TOPLEFT" }, "confidence": 0.8494512438774109, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 282.61951, "r_x1": 66.023834, "r_y1": 282.61951, "r_x2": 66.023834, "r_y2": 274.60357999999997, "r_x3": 50.112007, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.411568, "r_y0": 282.61951, "r_x1": 94.944016, "r_y1": 282.61951, "r_x2": 94.944016, "r_y2": 274.60357999999997, "r_x3": 68.411568, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.8708, "r_y0": 282.61951, "r_x1": 127.26788000000002, "r_y1": 282.61951, "r_x2": 127.26788000000002, "r_y2": 274.60357999999997, "r_x3": 100.8708, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19467, "r_y0": 282.61951, "r_x1": 165.83237, "r_y1": 282.61951, "r_x2": 165.83237, "r_y2": 274.60357999999997, "r_x3": 133.19467, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68269, "r_y0": 282.61951, "r_x1": 194.09445, "r_y1": 282.61951, "r_x2": 194.09445, "r_y2": 274.60357999999997, "r_x3": 172.68269, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02124, "r_y0": 282.61951, "r_x1": 211.4803, "r_y1": 282.61951, "r_x2": 211.4803, "r_y2": 274.60357999999997, "r_x3": 200.02124, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.40708999999998, "r_y0": 282.61951, "r_x1": 239.43755, "r_y1": 282.61951, "r_x2": 239.43755, "r_y2": 274.60357999999997, "r_x3": 217.40708999999998, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.28787000000003, "r_y0": 282.61951, "r_x1": 264.22067, "r_y1": 282.61951, "r_x2": 264.22067, "r_y2": 274.60357999999997, "r_x3": 246.28787000000003, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.14746, "r_y0": 282.61951, "r_x1": 286.35873, "r_y1": 282.61951, "r_x2": 286.35873, "r_y2": 274.60357999999997, "r_x3": 270.14746, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 293.57852, "r_x1": 286.36331, "r_y1": 293.57852, "r_x2": 286.36331, "r_y2": 285.56256, "r_x3": 70.031006, "r_y3": 285.56256, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 304.53751, "r_x1": 286.36331, "r_y1": 304.53751, "r_x2": 286.36331, "r_y2": 296.52155, "r_x3": 70.031006, "r_y3": 296.52155, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 315.49649, "r_x1": 77.500015, "r_y1": 315.49649, "r_x2": 77.500015, "r_y2": 307.48053, "r_x3": 70.031006, "r_y3": 307.48053, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.350006, "r_y0": 315.29028, "r_x1": 286.36627, "r_y1": 315.29028, "r_x2": 286.36627, "r_y2": 307.56122, "r_x3": 79.350006, "r_y3": 307.56122, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 326.24829, "r_x1": 147.57243, "r_y1": 326.24829, "r_x2": 147.57243, "r_y2": 318.51923, "r_x3": 70.031006, "r_y3": 318.51923, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57201, "r_y0": 326.4545, "r_x1": 271.33521, "r_y1": 326.4545, "r_x2": 271.33521, "r_y2": 318.43854, "r_x3": 147.57201, "r_y3": 318.43854, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 50.112007, "t": 329.76254, "r": 286.36334, "b": 381.61447, "coord_origin": "TOPLEFT" }, "confidence": 0.8567671179771423, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 337.7785, "r_x1": 65.366135, "r_y1": 337.7785, "r_x2": 65.366135, "r_y2": 329.76254, "r_x3": 50.112007, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.655159, "r_y0": 337.7785, "r_x1": 286.3587, "r_y1": 337.7785, "r_x2": 286.3587, "r_y2": 329.76254, "r_x3": 67.655159, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 348.7375200000001, "r_x1": 286.36334, "r_y1": 348.7375200000001, "r_x2": 286.36334, "r_y2": 340.72156000000007, "r_x3": 70.031006, "r_y3": 340.72156000000007, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 359.6965, "r_x1": 198.82439, "r_y1": 359.6965, "r_x2": 198.82439, "r_y2": 351.68054, "r_x3": 70.031006, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06027, "r_y0": 359.6965, "r_x1": 213.52928, "r_y1": 359.6965, "r_x2": 213.52928, "r_y2": 351.68054, "r_x3": 206.06027, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02101, "r_y0": 359.4903, "r_x1": 286.35815, "r_y1": 359.4903, "r_x2": 286.35815, "r_y2": 351.76123, "r_x3": 217.02101, "r_y3": 351.76123, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 370.44928, "r_x1": 143.08028, "r_y1": 370.44928, "r_x2": 143.08028, "r_y2": 362.72021, "r_x3": 70.031006, "r_y3": 362.72021, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.078, "r_y0": 370.65549000000004, "r_x1": 286.36111, "r_y1": 370.65549000000004, "r_x2": 286.36111, "r_y2": 362.63953000000004, "r_x3": 143.078, "r_y3": 362.63953000000004, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 381.61447, "r_x1": 161.15652, "r_y1": 381.61447, "r_x2": 161.15652, "r_y2": 373.59851, "r_x3": 70.031006, "r_y3": 373.59851, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 50.112007, "t": 384.92252, "r": 286.36389, "b": 458.69144, "coord_origin": "TOPLEFT" }, "confidence": 0.8832162618637085, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 392.93848, "r_x1": 65.140724, "r_y1": 392.93848, "r_x2": 65.140724, "r_y2": 384.92252, "r_x3": 50.112007, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.395927, "r_y0": 392.93848, "r_x1": 286.35876, "r_y1": 392.93848, "r_x2": 286.35876, "r_y2": 384.92252, "r_x3": 67.395927, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 403.89749, "r_x1": 286.36337, "r_y1": 403.89749, "r_x2": 286.36337, "r_y2": 395.88153, "r_x3": 70.031006, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 414.85648, "r_x1": 125.47024999999998, "r_y1": 414.85648, "r_x2": 125.47024999999998, "r_y2": 406.84052, "r_x3": 70.031006, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.90764, "r_y0": 414.85648, "r_x1": 230.83444, "r_y1": 414.85648, "r_x2": 230.83444, "r_y2": 406.84052, "r_x3": 133.90764, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27182, "r_y0": 414.85648, "r_x1": 286.36334, "r_y1": 414.85648, "r_x2": 286.36334, "r_y2": 406.84052, "r_x3": 239.27182, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 425.81546, "r_x1": 78.958366, "r_y1": 425.81546, "r_x2": 78.958366, "r_y2": 417.7995, "r_x3": 70.031006, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.254494, "r_y0": 425.81546, "r_x1": 286.36334, "r_y1": 425.81546, "r_x2": 286.36334, "r_y2": 417.7995, "r_x3": 81.254494, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.7734699999999, "r_x1": 196.7621, "r_y1": 436.7734699999999, "r_x2": 196.7621, "r_y2": 428.75751, "r_x3": 70.031006, "r_y3": 428.75751, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.20201, "r_y0": 436.56726, "r_x1": 286.36017, "r_y1": 436.56726, "r_x2": 286.36017, "r_y2": 428.8381999999999, "r_x3": 200.20201, "r_y3": 428.8381999999999, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 447.52624999999995, "r_x1": 189.19447, "r_y1": 447.52624999999995, "r_x2": 189.19447, "r_y2": 439.79717999999997, "r_x3": 70.031006, "r_y3": 439.79717999999997, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.19501, "r_y0": 447.73245, "r_x1": 286.36389, "r_y1": 447.73245, "r_x2": 286.36389, "r_y2": 439.71648999999996, "r_x3": 189.19501, "r_y3": 439.71648999999996, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 458.69144, "r_x1": 158.9239, "r_y1": 458.69144, "r_x2": 158.9239, "r_y2": 450.67548, "r_x3": 70.031006, "r_y3": 450.67548, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 50.112007, "t": 461.99948, "r": 286.36334, "b": 502.89243, "coord_origin": "TOPLEFT" }, "confidence": 0.8431925177574158, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 470.01544, "r_x1": 65.910469, "r_y1": 470.01544, "r_x2": 65.910469, "r_y2": 461.99948, "r_x3": 50.112007, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.281181, "r_y0": 470.01544, "r_x1": 286.35873, "r_y1": 470.01544, "r_x2": 286.35873, "r_y2": 461.99948, "r_x3": 68.281181, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 480.97446, "r_x1": 116.27969999999999, "r_y1": 480.97446, "r_x2": 116.27969999999999, "r_y2": 472.9585, "r_x3": 70.031006, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48445, "r_y0": 480.97446, "r_x1": 286.36334, "r_y1": 480.97446, "r_x2": 286.36334, "r_y2": 472.9585, "r_x3": 122.48445, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 491.93344, "r_x1": 103.30532, "r_y1": 491.93344, "r_x2": 103.30532, "r_y2": 483.91748, "r_x3": 70.031006, "r_y3": 483.91748, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.51601, "r_y0": 491.72723, "r_x1": 286.35931, "r_y1": 491.72723, "r_x2": 286.35931, "r_y2": 483.99817, "r_x3": 105.51601, "r_y3": 483.99817, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 502.68622, "r_x1": 212.51607, "r_y1": 502.68622, "r_x2": 212.51607, "r_y2": 494.95715, "r_x3": 70.031006, "r_y3": 494.95715, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51401, "r_y0": 502.89243, "r_x1": 263.55975, "r_y1": 502.89243, "r_x2": 263.55975, "r_y2": 494.87646, "r_x3": 212.51401, "r_y3": 494.87646, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 50.112015, "t": 506.20047, "r": 286.36337, "b": 547.09244, "coord_origin": "TOPLEFT" }, "confidence": 0.8405635952949524, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 514.21643, "r_x1": 65.682777, "r_y1": 514.21643, "r_x2": 65.682777, "r_y2": 506.20047, "r_x3": 50.112015, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.019325, "r_y0": 514.21643, "r_x1": 247.37280000000004, "r_y1": 514.21643, "r_x2": 247.37280000000004, "r_y2": 506.20047, "r_x3": 68.019325, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97208000000003, "r_y0": 514.21643, "r_x1": 286.3587, "r_y1": 514.21643, "r_x2": 286.3587, "r_y2": 506.20047, "r_x3": 253.97208000000003, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 525.17545, "r_x1": 265.62408, "r_y1": 525.17545, "r_x2": 265.62408, "r_y2": 517.15948, "r_x3": 70.031013, "r_y3": 517.15948, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.42902, "r_y0": 524.96924, "r_x1": 286.36182, "r_y1": 524.96924, "r_x2": 286.36182, "r_y2": 517.24017, "r_x3": 268.42902, "r_y3": 517.24017, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 535.92822, "r_x1": 286.36337, "r_y1": 535.92822, "r_x2": 286.36337, "r_y2": 528.19916, "r_x3": 70.031021, "r_y3": 528.19916, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 546.88622, "r_x1": 125.25507999999999, "r_y1": 546.88622, "r_x2": 125.25507999999999, "r_y2": 539.15718, "r_x3": 70.031021, "r_y3": 539.15718, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25402, "r_y0": 547.09244, "r_x1": 240.05083, "r_y1": 547.09244, "r_x2": 240.05083, "r_y2": 539.07648, "r_x3": 125.25402, "r_y3": 539.07648, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "list_item", "bbox": { "l": 50.112022, "t": 550.40048, "r": 286.36337, "b": 591.29344, "coord_origin": "TOPLEFT" }, "confidence": 0.8241521716117859, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 558.41644, "r_x1": 66.037048, "r_y1": 558.41644, "r_x2": 66.037048, "r_y2": 550.40048, "r_x3": 50.112022, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.426765, "r_y0": 558.41644, "r_x1": 286.3587, "r_y1": 558.41644, "r_x2": 286.3587, "r_y2": 550.40048, "r_x3": 68.426765, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 569.37544, "r_x1": 137.08176, "r_y1": 569.37544, "r_x2": 137.08176, "r_y2": 561.35948, "r_x3": 70.031021, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.9854, "r_y0": 569.37544, "r_x1": 172.38248, "r_y1": 569.37544, "r_x2": 172.38248, "r_y2": 561.35948, "r_x3": 145.9854, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7038, "r_y0": 569.37544, "r_x1": 286.36337, "r_y1": 569.37544, "r_x2": 286.36337, "r_y2": 561.35948, "r_x3": 178.7038, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 580.33444, "r_x1": 221.00723, "r_y1": 580.33444, "r_x2": 221.00723, "r_y2": 572.31848, "r_x3": 70.031021, "r_y3": 572.31848, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54300999999998, "r_y0": 580.12822, "r_x1": 286.35938, "r_y1": 580.12822, "r_x2": 286.35938, "r_y2": 572.39919, "r_x3": 232.54300999999998, "r_y3": 572.39919, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 591.08722, "r_x1": 135.53058, "r_y1": 591.08722, "r_x2": 135.53058, "r_y2": 583.35818, "r_x3": 70.031021, "r_y3": 583.35818, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53003, "r_y0": 591.29344, "r_x1": 167.89876, "r_y1": 591.29344, "r_x2": 167.89876, "r_y2": 583.27748, "r_x3": 135.53003, "r_y3": 583.27748, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 50.11203, "t": 594.60149, "r": 286.3634, "b": 635.49445, "coord_origin": "TOPLEFT" }, "confidence": 0.8360886573791504, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 602.61745, "r_x1": 65.23661, "r_y1": 602.61745, "r_x2": 65.23661, "r_y2": 594.60149, "r_x3": 50.11203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.506203, "r_y0": 602.61745, "r_x1": 286.3587, "r_y1": 602.61745, "r_x2": 286.3587, "r_y2": 594.60149, "r_x3": 67.506203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 613.57645, "r_x1": 109.1066, "r_y1": 613.57645, "r_x2": 109.1066, "r_y2": 605.56049, "r_x3": 70.031029, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.22592, "r_y0": 613.57645, "r_x1": 271.76605, "r_y1": 613.57645, "r_x2": 271.76605, "r_y2": 605.56049, "r_x3": 116.22592, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89435, "r_y0": 613.57645, "r_x1": 286.36337, "r_y1": 613.57645, "r_x2": 286.36337, "r_y2": 605.56049, "r_x3": 278.89435, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 624.32922, "r_x1": 286.3634, "r_y1": 624.32922, "r_x2": 286.3634, "r_y2": 616.60019, "r_x3": 70.031029, "r_y3": 616.60019, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 635.28822, "r_x1": 139.09921, "r_y1": 635.28822, "r_x2": 139.09921, "r_y2": 627.55919, "r_x3": 70.031029, "r_y3": 627.55919, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.09802, "r_y0": 635.49445, "r_x1": 238.95683, "r_y1": 635.49445, "r_x2": 238.95683, "r_y2": 627.47849, "r_x3": 139.09802, "r_y3": 627.47849, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 50.112022, "t": 638.80249, "r": 286.36337, "b": 690.65347, "coord_origin": "TOPLEFT" }, "confidence": 0.8079474568367004, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 646.81845, "r_x1": 65.203552, "r_y1": 646.81845, "r_x2": 65.203552, "r_y2": 638.80249, "r_x3": 50.112022, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.468193, "r_y0": 646.81845, "r_x1": 286.35873, "r_y1": 646.81845, "r_x2": 286.35873, "r_y2": 638.80249, "r_x3": 67.468193, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 657.77646, "r_x1": 286.36337, "r_y1": 657.77646, "r_x2": 286.36337, "r_y2": 649.7605, "r_x3": 70.031021, "r_y3": 649.7605, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 668.73547, "r_x1": 286.36334, "r_y1": 668.73547, "r_x2": 286.36334, "r_y2": 660.7195, "r_x3": 70.031021, "r_y3": 660.7195, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 679.69447, "r_x1": 158.45766, "r_y1": 679.69447, "r_x2": 158.45766, "r_y2": 671.6785, "r_x3": 70.031021, "r_y3": 671.6785, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.52802, "r_y0": 679.48824, "r_x1": 286.36249, "r_y1": 679.48824, "r_x2": 286.36249, "r_y2": 671.7592, "r_x3": 160.52802, "r_y3": 671.7592, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 690.44724, "r_x1": 171.42305, "r_y1": 690.44724, "r_x2": 171.42305, "r_y2": 682.7182, "r_x3": 70.031013, "r_y3": 682.7182, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42201, "r_y0": 690.65347, "r_x1": 212.75713, "r_y1": 690.65347, "r_x2": 212.75713, "r_y2": 682.6375, "r_x3": 171.42201, "r_y3": 682.6375, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 50.112015, "t": 693.961502, "r": 286.36334, "b": 712.936462, "coord_origin": "TOPLEFT" }, "confidence": 0.8385783433914185, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.977463, "r_x1": 66.506706, "r_y1": 701.977463, "r_x2": 66.506706, "r_y2": 693.961502, "r_x3": 50.112015, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.966896, "r_y0": 701.977463, "r_x1": 80.992294, "r_y1": 701.977463, "r_x2": 80.992294, "r_y2": 693.961502, "r_x3": 68.966896, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.062057, "r_y0": 701.977463, "r_x1": 114.71492999999998, "r_y1": 701.977463, "r_x2": 114.71492999999998, "r_y2": 693.961502, "r_x3": 89.062057, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.24621000000002, "r_y0": 701.977463, "r_x1": 149.1459, "r_y1": 701.977463, "r_x2": 149.1459, "r_y2": 693.961502, "r_x3": 124.24621000000002, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22462, "r_y0": 701.977463, "r_x1": 209.37321, "r_y1": 701.977463, "r_x2": 209.37321, "r_y2": 693.961502, "r_x3": 157.22462, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9045, "r_y0": 701.977463, "r_x1": 231.85196999999997, "r_y1": 701.977463, "r_x2": 231.85196999999997, "r_y2": 693.961502, "r_x3": 218.9045, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93069, "r_y0": 701.977463, "r_x1": 269.32254, "r_y1": 701.977463, "r_x2": 269.32254, "r_y2": 693.961502, "r_x3": 239.93069, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.3923, "r_y0": 701.977463, "r_x1": 286.3587, "r_y1": 701.977463, "r_x2": 286.3587, "r_y2": 693.961502, "r_x3": 277.3923, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 712.936462, "r_x1": 286.36334, "r_y1": 712.936462, "r_x2": 286.36334, "r_y2": 704.920502, "r_x3": 70.031013, "r_y3": 704.920502, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "list_item", "bbox": { "l": 328.78101, "t": 75.88347999999996, "r": 545.11456, "b": 116.77544999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.7556979060173035, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 83.89948000000015, "r_x1": 545.11346, "r_y1": 83.89948000000015, "r_x2": 545.11346, "r_y2": 75.88347999999996, "r_x3": 328.78101, "r_y3": 75.88347999999996, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 94.85748000000001, "r_x1": 472.30618, "r_y1": 94.85748000000001, "r_x2": 472.30618, "r_y2": 86.84149000000002, "r_x3": 328.78101, "r_y3": 86.84149000000002, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.88501, "r_y0": 94.65125, "r_x1": 545.11456, "r_y1": 94.65125, "r_x2": 545.11456, "r_y2": 86.92218000000003, "r_x3": 475.88501, "r_y3": 86.92218000000003, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 105.61023, "r_x1": 371.92734, "r_y1": 105.61023, "r_x2": 371.92734, "r_y2": 97.88116000000002, "r_x3": 328.78101, "r_y3": 97.88116000000002, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.92599, "r_y0": 105.81646999999987, "r_x1": 545.11206, "r_y1": 105.81646999999987, "r_x2": 545.11206, "r_y2": 97.80048, "r_x3": 371.92599, "r_y3": 97.80048, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 116.77544999999998, "r_x1": 417.70087, "r_y1": 116.77544999999998, "r_x2": 417.70087, "r_y2": 108.75945999999999, "r_x3": 328.78101, "r_y3": 108.75945999999999, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 120.71447999999998, "r": 545.11334, "b": 161.60742000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.8375797271728516, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 128.73046999999997, "r_x1": 324.33197, "r_y1": 128.73046999999997, "r_x2": 324.33197, "r_y2": 120.71447999999998, "r_x3": 308.862, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65341, "r_y0": 128.73046999999997, "r_x1": 545.10876, "r_y1": 128.73046999999997, "r_x2": 545.10876, "r_y2": 120.71447999999998, "r_x3": 326.65341, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 139.68944999999997, "r_x1": 545.11334, "r_y1": 139.68944999999997, "r_x2": 545.11334, "r_y2": 131.67345999999998, "r_x3": 328.78101, "r_y3": 131.67345999999998, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 150.44219999999996, "r_x1": 545.11328, "r_y1": 150.44219999999996, "r_x2": 545.11328, "r_y2": 142.71312999999998, "r_x3": 328.78101, "r_y3": 142.71312999999998, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.40117999999995, "r_x1": 406.32245, "r_y1": 161.40117999999995, "r_x2": 406.32245, "r_y2": 153.67211999999995, "r_x3": 328.78101, "r_y3": 153.67211999999995, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 161.60742000000005, "r_x1": 506.18085, "r_y1": 161.60742000000005, "r_x2": 506.18085, "r_y2": 153.59142999999995, "r_x3": 406.32202, "r_y3": 153.59142999999995, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.1329920000001, "r": 302.59259, "b": 743.039555, "coord_origin": "TOPLEFT" }, "confidence": 0.9069584012031555, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.039555, "r_x1": 302.59259, "r_y1": 743.039555, "r_x2": 302.59259, "r_y2": 734.1329920000001, "r_x3": 292.63, "r_y3": 734.1329920000001, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 15, "page_no": 9, "cluster": { "id": 15, "label": "text", "bbox": { "l": 70.030998, "t": 75.88378999999998, "r": 286.36176, "b": 94.85875999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.6886764168739319, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.69353999999998, "r_x1": 223.58061, "r_y1": 83.69353999999998, "r_x2": 223.58061, "r_y2": 75.96447999999998, "r_x3": 70.030998, "r_y3": 75.96447999999998, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.57901, "r_y0": 83.89977999999996, "r_x1": 286.36176, "r_y1": 83.89977999999996, "r_x2": 286.36176, "r_y2": 75.88378999999998, "r_x3": 223.57901, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 94.85875999999996, "r_x1": 97.916512, "r_y1": 94.85875999999996, "r_x2": 97.916512, "r_y2": 86.84276999999997, "r_x3": 70.031006, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6" }, { "label": "list_item", "id": 13, "page_no": 9, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.112007, "t": 98.16576999999995, "r": 286.36578, "b": 160.97668, "coord_origin": "TOPLEFT" }, "confidence": 0.7723011374473572, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 106.18176000000005, "r_x1": 65.534088, "r_y1": 106.18176000000005, "r_x2": 65.534088, "r_y2": 98.16576999999995, "r_x3": 50.112007, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 106.18176000000005, "r_x1": 286.35867, "r_y1": 106.18176000000005, "r_x2": 286.35867, "r_y2": 98.16576999999995, "r_x3": 67.84832, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 117.14075000000003, "r_x1": 286.36331, "r_y1": 117.14075000000003, "r_x2": 286.36331, "r_y2": 109.12476000000004, "r_x3": 70.031006, "r_y3": 109.12476000000004, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 128.0997299999999, "r_x1": 286.36334, "r_y1": 128.0997299999999, "r_x2": 286.36334, "r_y2": 120.08374000000003, "r_x3": 70.031006, "r_y3": 120.08374000000003, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.05872, "r_x1": 77.500015, "r_y1": 139.05872, "r_x2": 77.500015, "r_y2": 131.04272000000003, "r_x3": 70.031006, "r_y3": 131.04272000000003, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.560005, "r_y0": 138.85248, "r_x1": 286.36578, "r_y1": 138.85248, "r_x2": 286.36578, "r_y2": 131.12341000000004, "r_x3": 80.560005, "r_y3": 131.12341000000004, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.81146, "r_x1": 195.22885, "r_y1": 149.81146, "r_x2": 195.22885, "r_y2": 142.0824, "r_x3": 70.031006, "r_y3": 142.0824, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.231, "r_y0": 150.0177, "r_x1": 286.36548, "r_y1": 150.0177, "r_x2": 286.36548, "r_y2": 142.00171, "r_x3": 195.231, "r_y3": 142.00171, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 160.97668, "r_x1": 120.33251, "r_y1": 160.97668, "r_x2": 120.33251, "r_y2": 152.96069, "r_x3": 70.031006, "r_y3": 152.96069, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1" }, { "label": "list_item", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.112007, "t": 164.28467, "r": 286.36337, "b": 227.0946, "coord_origin": "TOPLEFT" }, "confidence": 0.8580600619316101, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 172.30066, "r_x1": 65.534088, "r_y1": 172.30066, "r_x2": 65.534088, "r_y2": 164.28467, "r_x3": 50.112007, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 172.30066, "r_x1": 286.35867, "r_y1": 172.30066, "r_x2": 286.35867, "r_y2": 164.28467, "r_x3": 67.84832, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 183.25964, "r_x1": 286.36337, "r_y1": 183.25964, "r_x2": 286.36337, "r_y2": 175.24365, "r_x3": 70.031006, "r_y3": 175.24365, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 194.21862999999996, "r_x1": 286.36334, "r_y1": 194.21862999999996, "r_x2": 286.36334, "r_y2": 186.20263999999997, "r_x3": 70.031006, "r_y3": 186.20263999999997, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 205.17760999999996, "r_x1": 101.33271, "r_y1": 205.17760999999996, "r_x2": 101.33271, "r_y2": 197.16161999999997, "r_x3": 70.031006, "r_y3": 197.16161999999997, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33101, "r_y0": 204.97136999999998, "r_x1": 286.35791, "r_y1": 204.97136999999998, "r_x2": 286.35791, "r_y2": 197.24230999999997, "r_x3": 104.33101, "r_y3": 197.24230999999997, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 215.92938000000004, "r_x1": 220.48719999999997, "r_y1": 215.92938000000004, "r_x2": 220.48719999999997, "r_y2": 208.20032000000003, "r_x3": 70.031006, "r_y3": 208.20032000000003, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48401000000004, "r_y0": 216.13562000000002, "r_x1": 286.36017, "r_y1": 216.13562000000002, "r_x2": 286.36017, "r_y2": 208.11963000000003, "r_x3": 220.48401000000004, "r_y3": 208.11963000000003, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 227.0946, "r_x1": 166.65294, "r_y1": 227.0946, "r_x2": 166.65294, "r_y2": 219.07861000000003, "r_x3": 70.031006, "r_y3": 219.07861000000003, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3" }, { "label": "list_item", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 50.112007, "t": 230.40259000000003, "r": 286.36578, "b": 271.29553, "coord_origin": "TOPLEFT" }, "confidence": 0.8512731194496155, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 238.41858000000002, "r_x1": 65.650383, "r_y1": 238.41858000000002, "r_x2": 65.650383, "r_y2": 230.40259000000003, "r_x3": 50.112007, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.982063, "r_y0": 238.41858000000002, "r_x1": 286.3587, "r_y1": 238.41858000000002, "r_x2": 286.3587, "r_y2": 230.40259000000003, "r_x3": 67.982063, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 249.37756000000002, "r_x1": 147.16895, "r_y1": 249.37756000000002, "r_x2": 147.16895, "r_y2": 241.36157000000003, "r_x3": 70.031006, "r_y3": 241.36157000000003, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93301, "r_y0": 249.17133, "r_x1": 286.36578, "r_y1": 249.17133, "r_x2": 286.36578, "r_y2": 241.44226000000003, "r_x3": 149.93301, "r_y3": 241.44226000000003, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 260.13031, "r_x1": 244.6875, "r_y1": 260.13031, "r_x2": 244.6875, "r_y2": 252.40125, "r_x3": 70.031013, "r_y3": 252.40125, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69101, "r_y0": 260.33655, "r_x1": 286.35791, "r_y1": 260.33655, "r_x2": 286.35791, "r_y2": 252.32056, "r_x3": 244.69101, "r_y3": 252.32056, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 271.29553, "r_x1": 111.36611, "r_y1": 271.29553, "r_x2": 111.36611, "r_y2": 263.27954, "r_x3": 70.031006, "r_y3": 263.27954, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2" }, { "label": "list_item", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.112007, "t": 274.60357999999997, "r": 286.36627, "b": 326.4545, "coord_origin": "TOPLEFT" }, "confidence": 0.8494512438774109, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 282.61951, "r_x1": 66.023834, "r_y1": 282.61951, "r_x2": 66.023834, "r_y2": 274.60357999999997, "r_x3": 50.112007, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.411568, "r_y0": 282.61951, "r_x1": 94.944016, "r_y1": 282.61951, "r_x2": 94.944016, "r_y2": 274.60357999999997, "r_x3": 68.411568, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.8708, "r_y0": 282.61951, "r_x1": 127.26788000000002, "r_y1": 282.61951, "r_x2": 127.26788000000002, "r_y2": 274.60357999999997, "r_x3": 100.8708, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19467, "r_y0": 282.61951, "r_x1": 165.83237, "r_y1": 282.61951, "r_x2": 165.83237, "r_y2": 274.60357999999997, "r_x3": 133.19467, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68269, "r_y0": 282.61951, "r_x1": 194.09445, "r_y1": 282.61951, "r_x2": 194.09445, "r_y2": 274.60357999999997, "r_x3": 172.68269, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02124, "r_y0": 282.61951, "r_x1": 211.4803, "r_y1": 282.61951, "r_x2": 211.4803, "r_y2": 274.60357999999997, "r_x3": 200.02124, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.40708999999998, "r_y0": 282.61951, "r_x1": 239.43755, "r_y1": 282.61951, "r_x2": 239.43755, "r_y2": 274.60357999999997, "r_x3": 217.40708999999998, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.28787000000003, "r_y0": 282.61951, "r_x1": 264.22067, "r_y1": 282.61951, "r_x2": 264.22067, "r_y2": 274.60357999999997, "r_x3": 246.28787000000003, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.14746, "r_y0": 282.61951, "r_x1": 286.35873, "r_y1": 282.61951, "r_x2": 286.35873, "r_y2": 274.60357999999997, "r_x3": 270.14746, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 293.57852, "r_x1": 286.36331, "r_y1": 293.57852, "r_x2": 286.36331, "r_y2": 285.56256, "r_x3": 70.031006, "r_y3": 285.56256, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 304.53751, "r_x1": 286.36331, "r_y1": 304.53751, "r_x2": 286.36331, "r_y2": 296.52155, "r_x3": 70.031006, "r_y3": 296.52155, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 315.49649, "r_x1": 77.500015, "r_y1": 315.49649, "r_x2": 77.500015, "r_y2": 307.48053, "r_x3": 70.031006, "r_y3": 307.48053, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.350006, "r_y0": 315.29028, "r_x1": 286.36627, "r_y1": 315.29028, "r_x2": 286.36627, "r_y2": 307.56122, "r_x3": 79.350006, "r_y3": 307.56122, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 326.24829, "r_x1": 147.57243, "r_y1": 326.24829, "r_x2": 147.57243, "r_y2": 318.51923, "r_x3": 70.031006, "r_y3": 318.51923, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57201, "r_y0": 326.4545, "r_x1": 271.33521, "r_y1": 326.4545, "r_x2": 271.33521, "r_y2": 318.43854, "r_x3": 147.57201, "r_y3": 318.43854, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3" }, { "label": "list_item", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 50.112007, "t": 329.76254, "r": 286.36334, "b": 381.61447, "coord_origin": "TOPLEFT" }, "confidence": 0.8567671179771423, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 337.7785, "r_x1": 65.366135, "r_y1": 337.7785, "r_x2": 65.366135, "r_y2": 329.76254, "r_x3": 50.112007, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.655159, "r_y0": 337.7785, "r_x1": 286.3587, "r_y1": 337.7785, "r_x2": 286.3587, "r_y2": 329.76254, "r_x3": 67.655159, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 348.7375200000001, "r_x1": 286.36334, "r_y1": 348.7375200000001, "r_x2": 286.36334, "r_y2": 340.72156000000007, "r_x3": 70.031006, "r_y3": 340.72156000000007, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 359.6965, "r_x1": 198.82439, "r_y1": 359.6965, "r_x2": 198.82439, "r_y2": 351.68054, "r_x3": 70.031006, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06027, "r_y0": 359.6965, "r_x1": 213.52928, "r_y1": 359.6965, "r_x2": 213.52928, "r_y2": 351.68054, "r_x3": 206.06027, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02101, "r_y0": 359.4903, "r_x1": 286.35815, "r_y1": 359.4903, "r_x2": 286.35815, "r_y2": 351.76123, "r_x3": 217.02101, "r_y3": 351.76123, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 370.44928, "r_x1": 143.08028, "r_y1": 370.44928, "r_x2": 143.08028, "r_y2": 362.72021, "r_x3": 70.031006, "r_y3": 362.72021, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.078, "r_y0": 370.65549000000004, "r_x1": 286.36111, "r_y1": 370.65549000000004, "r_x2": 286.36111, "r_y2": 362.63953000000004, "r_x3": 143.078, "r_y3": 362.63953000000004, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 381.61447, "r_x1": 161.15652, "r_y1": 381.61447, "r_x2": 161.15652, "r_y2": 373.59851, "r_x3": 70.031006, "r_y3": 373.59851, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1" }, { "label": "list_item", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 50.112007, "t": 384.92252, "r": 286.36389, "b": 458.69144, "coord_origin": "TOPLEFT" }, "confidence": 0.8832162618637085, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 392.93848, "r_x1": 65.140724, "r_y1": 392.93848, "r_x2": 65.140724, "r_y2": 384.92252, "r_x3": 50.112007, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.395927, "r_y0": 392.93848, "r_x1": 286.35876, "r_y1": 392.93848, "r_x2": 286.35876, "r_y2": 384.92252, "r_x3": 67.395927, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 403.89749, "r_x1": 286.36337, "r_y1": 403.89749, "r_x2": 286.36337, "r_y2": 395.88153, "r_x3": 70.031006, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 414.85648, "r_x1": 125.47024999999998, "r_y1": 414.85648, "r_x2": 125.47024999999998, "r_y2": 406.84052, "r_x3": 70.031006, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.90764, "r_y0": 414.85648, "r_x1": 230.83444, "r_y1": 414.85648, "r_x2": 230.83444, "r_y2": 406.84052, "r_x3": 133.90764, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27182, "r_y0": 414.85648, "r_x1": 286.36334, "r_y1": 414.85648, "r_x2": 286.36334, "r_y2": 406.84052, "r_x3": 239.27182, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 425.81546, "r_x1": 78.958366, "r_y1": 425.81546, "r_x2": 78.958366, "r_y2": 417.7995, "r_x3": 70.031006, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.254494, "r_y0": 425.81546, "r_x1": 286.36334, "r_y1": 425.81546, "r_x2": 286.36334, "r_y2": 417.7995, "r_x3": 81.254494, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.7734699999999, "r_x1": 196.7621, "r_y1": 436.7734699999999, "r_x2": 196.7621, "r_y2": 428.75751, "r_x3": 70.031006, "r_y3": 428.75751, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.20201, "r_y0": 436.56726, "r_x1": 286.36017, "r_y1": 436.56726, "r_x2": 286.36017, "r_y2": 428.8381999999999, "r_x3": 200.20201, "r_y3": 428.8381999999999, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 447.52624999999995, "r_x1": 189.19447, "r_y1": 447.52624999999995, "r_x2": 189.19447, "r_y2": 439.79717999999997, "r_x3": 70.031006, "r_y3": 439.79717999999997, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.19501, "r_y0": 447.73245, "r_x1": 286.36389, "r_y1": 447.73245, "r_x2": 286.36389, "r_y2": 439.71648999999996, "r_x3": 189.19501, "r_y3": 439.71648999999996, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 458.69144, "r_x1": 158.9239, "r_y1": 458.69144, "r_x2": 158.9239, "r_y2": 450.67548, "r_x3": 70.031006, "r_y3": 450.67548, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5" }, { "label": "list_item", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 50.112007, "t": 461.99948, "r": 286.36334, "b": 502.89243, "coord_origin": "TOPLEFT" }, "confidence": 0.8431925177574158, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 470.01544, "r_x1": 65.910469, "r_y1": 470.01544, "r_x2": 65.910469, "r_y2": 461.99948, "r_x3": 50.112007, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.281181, "r_y0": 470.01544, "r_x1": 286.35873, "r_y1": 470.01544, "r_x2": 286.35873, "r_y2": 461.99948, "r_x3": 68.281181, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 480.97446, "r_x1": 116.27969999999999, "r_y1": 480.97446, "r_x2": 116.27969999999999, "r_y2": 472.9585, "r_x3": 70.031006, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48445, "r_y0": 480.97446, "r_x1": 286.36334, "r_y1": 480.97446, "r_x2": 286.36334, "r_y2": 472.9585, "r_x3": 122.48445, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 491.93344, "r_x1": 103.30532, "r_y1": 491.93344, "r_x2": 103.30532, "r_y2": 483.91748, "r_x3": 70.031006, "r_y3": 483.91748, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.51601, "r_y0": 491.72723, "r_x1": 286.35931, "r_y1": 491.72723, "r_x2": 286.35931, "r_y2": 483.99817, "r_x3": 105.51601, "r_y3": 483.99817, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 502.68622, "r_x1": 212.51607, "r_y1": 502.68622, "r_x2": 212.51607, "r_y2": 494.95715, "r_x3": 70.031006, "r_y3": 494.95715, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51401, "r_y0": 502.89243, "r_x1": 263.55975, "r_y1": 502.89243, "r_x2": 263.55975, "r_y2": 494.87646, "r_x3": 212.51401, "r_y3": 494.87646, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2" }, { "label": "list_item", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 50.112015, "t": 506.20047, "r": 286.36337, "b": 547.09244, "coord_origin": "TOPLEFT" }, "confidence": 0.8405635952949524, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 514.21643, "r_x1": 65.682777, "r_y1": 514.21643, "r_x2": 65.682777, "r_y2": 506.20047, "r_x3": 50.112015, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.019325, "r_y0": 514.21643, "r_x1": 247.37280000000004, "r_y1": 514.21643, "r_x2": 247.37280000000004, "r_y2": 506.20047, "r_x3": 68.019325, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97208000000003, "r_y0": 514.21643, "r_x1": 286.3587, "r_y1": 514.21643, "r_x2": 286.3587, "r_y2": 506.20047, "r_x3": 253.97208000000003, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 525.17545, "r_x1": 265.62408, "r_y1": 525.17545, "r_x2": 265.62408, "r_y2": 517.15948, "r_x3": 70.031013, "r_y3": 517.15948, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.42902, "r_y0": 524.96924, "r_x1": 286.36182, "r_y1": 524.96924, "r_x2": 286.36182, "r_y2": 517.24017, "r_x3": 268.42902, "r_y3": 517.24017, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 535.92822, "r_x1": 286.36337, "r_y1": 535.92822, "r_x2": 286.36337, "r_y2": 528.19916, "r_x3": 70.031021, "r_y3": 528.19916, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 546.88622, "r_x1": 125.25507999999999, "r_y1": 546.88622, "r_x2": 125.25507999999999, "r_y2": 539.15718, "r_x3": 70.031021, "r_y3": 539.15718, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25402, "r_y0": 547.09244, "r_x1": 240.05083, "r_y1": 547.09244, "r_x2": 240.05083, "r_y2": 539.07648, "r_x3": 125.25402, "r_y3": 539.07648, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3" }, { "label": "list_item", "id": 11, "page_no": 9, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.112022, "t": 550.40048, "r": 286.36337, "b": 591.29344, "coord_origin": "TOPLEFT" }, "confidence": 0.8241521716117859, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 558.41644, "r_x1": 66.037048, "r_y1": 558.41644, "r_x2": 66.037048, "r_y2": 550.40048, "r_x3": 50.112022, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.426765, "r_y0": 558.41644, "r_x1": 286.3587, "r_y1": 558.41644, "r_x2": 286.3587, "r_y2": 550.40048, "r_x3": 68.426765, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 569.37544, "r_x1": 137.08176, "r_y1": 569.37544, "r_x2": 137.08176, "r_y2": 561.35948, "r_x3": 70.031021, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.9854, "r_y0": 569.37544, "r_x1": 172.38248, "r_y1": 569.37544, "r_x2": 172.38248, "r_y2": 561.35948, "r_x3": 145.9854, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7038, "r_y0": 569.37544, "r_x1": 286.36337, "r_y1": 569.37544, "r_x2": 286.36337, "r_y2": 561.35948, "r_x3": 178.7038, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 580.33444, "r_x1": 221.00723, "r_y1": 580.33444, "r_x2": 221.00723, "r_y2": 572.31848, "r_x3": 70.031021, "r_y3": 572.31848, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54300999999998, "r_y0": 580.12822, "r_x1": 286.35938, "r_y1": 580.12822, "r_x2": 286.35938, "r_y2": 572.39919, "r_x3": 232.54300999999998, "r_y3": 572.39919, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 591.08722, "r_x1": 135.53058, "r_y1": 591.08722, "r_x2": 135.53058, "r_y2": 583.35818, "r_x3": 70.031021, "r_y3": 583.35818, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53003, "r_y0": 591.29344, "r_x1": 167.89876, "r_y1": 591.29344, "r_x2": 167.89876, "r_y2": 583.27748, "r_x3": 135.53003, "r_y3": 583.27748, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3" }, { "label": "list_item", "id": 10, "page_no": 9, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.11203, "t": 594.60149, "r": 286.3634, "b": 635.49445, "coord_origin": "TOPLEFT" }, "confidence": 0.8360886573791504, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 602.61745, "r_x1": 65.23661, "r_y1": 602.61745, "r_x2": 65.23661, "r_y2": 594.60149, "r_x3": 50.11203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.506203, "r_y0": 602.61745, "r_x1": 286.3587, "r_y1": 602.61745, "r_x2": 286.3587, "r_y2": 594.60149, "r_x3": 67.506203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 613.57645, "r_x1": 109.1066, "r_y1": 613.57645, "r_x2": 109.1066, "r_y2": 605.56049, "r_x3": 70.031029, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.22592, "r_y0": 613.57645, "r_x1": 271.76605, "r_y1": 613.57645, "r_x2": 271.76605, "r_y2": 605.56049, "r_x3": 116.22592, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89435, "r_y0": 613.57645, "r_x1": 286.36337, "r_y1": 613.57645, "r_x2": 286.36337, "r_y2": 605.56049, "r_x3": 278.89435, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 624.32922, "r_x1": 286.3634, "r_y1": 624.32922, "r_x2": 286.3634, "r_y2": 616.60019, "r_x3": 70.031029, "r_y3": 616.60019, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 635.28822, "r_x1": 139.09921, "r_y1": 635.28822, "r_x2": 139.09921, "r_y2": 627.55919, "r_x3": 70.031029, "r_y3": 627.55919, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.09802, "r_y0": 635.49445, "r_x1": 238.95683, "r_y1": 635.49445, "r_x2": 238.95683, "r_y2": 627.47849, "r_x3": 139.09802, "r_y3": 627.47849, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4" }, { "label": "list_item", "id": 12, "page_no": 9, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 50.112022, "t": 638.80249, "r": 286.36337, "b": 690.65347, "coord_origin": "TOPLEFT" }, "confidence": 0.8079474568367004, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 646.81845, "r_x1": 65.203552, "r_y1": 646.81845, "r_x2": 65.203552, "r_y2": 638.80249, "r_x3": 50.112022, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.468193, "r_y0": 646.81845, "r_x1": 286.35873, "r_y1": 646.81845, "r_x2": 286.35873, "r_y2": 638.80249, "r_x3": 67.468193, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 657.77646, "r_x1": 286.36337, "r_y1": 657.77646, "r_x2": 286.36337, "r_y2": 649.7605, "r_x3": 70.031021, "r_y3": 649.7605, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 668.73547, "r_x1": 286.36334, "r_y1": 668.73547, "r_x2": 286.36334, "r_y2": 660.7195, "r_x3": 70.031021, "r_y3": 660.7195, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 679.69447, "r_x1": 158.45766, "r_y1": 679.69447, "r_x2": 158.45766, "r_y2": 671.6785, "r_x3": 70.031021, "r_y3": 671.6785, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.52802, "r_y0": 679.48824, "r_x1": 286.36249, "r_y1": 679.48824, "r_x2": 286.36249, "r_y2": 671.7592, "r_x3": 160.52802, "r_y3": 671.7592, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 690.44724, "r_x1": 171.42305, "r_y1": 690.44724, "r_x2": 171.42305, "r_y2": 682.7182, "r_x3": 70.031013, "r_y3": 682.7182, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42201, "r_y0": 690.65347, "r_x1": 212.75713, "r_y1": 690.65347, "r_x2": 212.75713, "r_y2": 682.6375, "r_x3": 171.42201, "r_y3": 682.6375, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 9, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.112015, "t": 693.961502, "r": 286.36334, "b": 712.936462, "coord_origin": "TOPLEFT" }, "confidence": 0.8385783433914185, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.977463, "r_x1": 66.506706, "r_y1": 701.977463, "r_x2": 66.506706, "r_y2": 693.961502, "r_x3": 50.112015, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.966896, "r_y0": 701.977463, "r_x1": 80.992294, "r_y1": 701.977463, "r_x2": 80.992294, "r_y2": 693.961502, "r_x3": 68.966896, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.062057, "r_y0": 701.977463, "r_x1": 114.71492999999998, "r_y1": 701.977463, "r_x2": 114.71492999999998, "r_y2": 693.961502, "r_x3": 89.062057, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.24621000000002, "r_y0": 701.977463, "r_x1": 149.1459, "r_y1": 701.977463, "r_x2": 149.1459, "r_y2": 693.961502, "r_x3": 124.24621000000002, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22462, "r_y0": 701.977463, "r_x1": 209.37321, "r_y1": 701.977463, "r_x2": 209.37321, "r_y2": 693.961502, "r_x3": 157.22462, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9045, "r_y0": 701.977463, "r_x1": 231.85196999999997, "r_y1": 701.977463, "r_x2": 231.85196999999997, "r_y2": 693.961502, "r_x3": 218.9045, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93069, "r_y0": 701.977463, "r_x1": 269.32254, "r_y1": 701.977463, "r_x2": 269.32254, "r_y2": 693.961502, "r_x3": 239.93069, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.3923, "r_y0": 701.977463, "r_x1": 286.3587, "r_y1": 701.977463, "r_x2": 286.3587, "r_y2": 693.961502, "r_x3": 277.3923, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 712.936462, "r_x1": 286.36334, "r_y1": 712.936462, "r_x2": 286.36334, "r_y2": 704.920502, "r_x3": 70.031013, "r_y3": 704.920502, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model," }, { "label": "list_item", "id": 14, "page_no": 9, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 328.78101, "t": 75.88347999999996, "r": 545.11456, "b": 116.77544999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.7556979060173035, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 83.89948000000015, "r_x1": 545.11346, "r_y1": 83.89948000000015, "r_x2": 545.11346, "r_y2": 75.88347999999996, "r_x3": 328.78101, "r_y3": 75.88347999999996, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 94.85748000000001, "r_x1": 472.30618, "r_y1": 94.85748000000001, "r_x2": 472.30618, "r_y2": 86.84149000000002, "r_x3": 328.78101, "r_y3": 86.84149000000002, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.88501, "r_y0": 94.65125, "r_x1": 545.11456, "r_y1": 94.65125, "r_x2": 545.11456, "r_y2": 86.92218000000003, "r_x3": 475.88501, "r_y3": 86.92218000000003, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 105.61023, "r_x1": 371.92734, "r_y1": 105.61023, "r_x2": 371.92734, "r_y2": 97.88116000000002, "r_x3": 328.78101, "r_y3": 97.88116000000002, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.92599, "r_y0": 105.81646999999987, "r_x1": 545.11206, "r_y1": 105.81646999999987, "r_x2": 545.11206, "r_y2": 97.80048, "r_x3": 371.92599, "r_y3": 97.80048, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 116.77544999999998, "r_x1": 417.70087, "r_y1": 116.77544999999998, "r_x2": 417.70087, "r_y2": 108.75945999999999, "r_x3": 328.78101, "r_y3": 108.75945999999999, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7" }, { "label": "list_item", "id": 9, "page_no": 9, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 120.71447999999998, "r": 545.11334, "b": 161.60742000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.8375797271728516, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 128.73046999999997, "r_x1": 324.33197, "r_y1": 128.73046999999997, "r_x2": 324.33197, "r_y2": 120.71447999999998, "r_x3": 308.862, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65341, "r_y0": 128.73046999999997, "r_x1": 545.10876, "r_y1": 128.73046999999997, "r_x2": 545.10876, "r_y2": 120.71447999999998, "r_x3": 326.65341, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 139.68944999999997, "r_x1": 545.11334, "r_y1": 139.68944999999997, "r_x2": 545.11334, "r_y2": 131.67345999999998, "r_x3": 328.78101, "r_y3": 131.67345999999998, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 150.44219999999996, "r_x1": 545.11328, "r_y1": 150.44219999999996, "r_x2": 545.11328, "r_y2": 142.71312999999998, "r_x3": 328.78101, "r_y3": 142.71312999999998, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.40117999999995, "r_x1": 406.32245, "r_y1": 161.40117999999995, "r_x2": 406.32245, "r_y2": 153.67211999999995, "r_x3": 328.78101, "r_y3": 153.67211999999995, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 161.60742000000005, "r_x1": 506.18085, "r_y1": 161.60742000000005, "r_x2": 506.18085, "r_y2": 153.59142999999995, "r_x3": 406.32202, "r_y3": 153.59142999999995, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1" }, { "label": "page_footer", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.1329920000001, "r": 302.59259, "b": 743.039555, "coord_origin": "TOPLEFT" }, "confidence": 0.9069584012031555, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.039555, "r_x1": 302.59259, "r_y1": 743.039555, "r_x2": 302.59259, "r_y2": 734.1329920000001, "r_x3": 292.63, "r_y3": 734.1329920000001, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" } ], "body": [ { "label": "text", "id": 15, "page_no": 9, "cluster": { "id": 15, "label": "text", "bbox": { "l": 70.030998, "t": 75.88378999999998, "r": 286.36176, "b": 94.85875999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.6886764168739319, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.030998, "r_y0": 83.69353999999998, "r_x1": 223.58061, "r_y1": 83.69353999999998, "r_x2": 223.58061, "r_y2": 75.96447999999998, "r_x3": 70.030998, "r_y3": 75.96447999999998, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.57901, "r_y0": 83.89977999999996, "r_x1": 286.36176, "r_y1": 83.89977999999996, "r_x2": 286.36176, "r_y2": 75.88378999999998, "r_x3": 223.57901, "r_y3": 75.88378999999998, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 94.85875999999996, "r_x1": 97.916512, "r_y1": 94.85875999999996, "r_x2": 97.916512, "r_y2": 86.84276999999997, "r_x3": 70.031006, "r_y3": 86.84276999999997, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6" }, { "label": "list_item", "id": 13, "page_no": 9, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.112007, "t": 98.16576999999995, "r": 286.36578, "b": 160.97668, "coord_origin": "TOPLEFT" }, "confidence": 0.7723011374473572, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 106.18176000000005, "r_x1": 65.534088, "r_y1": 106.18176000000005, "r_x2": 65.534088, "r_y2": 98.16576999999995, "r_x3": 50.112007, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 106.18176000000005, "r_x1": 286.35867, "r_y1": 106.18176000000005, "r_x2": 286.35867, "r_y2": 98.16576999999995, "r_x3": 67.84832, "r_y3": 98.16576999999995, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 117.14075000000003, "r_x1": 286.36331, "r_y1": 117.14075000000003, "r_x2": 286.36331, "r_y2": 109.12476000000004, "r_x3": 70.031006, "r_y3": 109.12476000000004, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 128.0997299999999, "r_x1": 286.36334, "r_y1": 128.0997299999999, "r_x2": 286.36334, "r_y2": 120.08374000000003, "r_x3": 70.031006, "r_y3": 120.08374000000003, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 139.05872, "r_x1": 77.500015, "r_y1": 139.05872, "r_x2": 77.500015, "r_y2": 131.04272000000003, "r_x3": 70.031006, "r_y3": 131.04272000000003, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.560005, "r_y0": 138.85248, "r_x1": 286.36578, "r_y1": 138.85248, "r_x2": 286.36578, "r_y2": 131.12341000000004, "r_x3": 80.560005, "r_y3": 131.12341000000004, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 149.81146, "r_x1": 195.22885, "r_y1": 149.81146, "r_x2": 195.22885, "r_y2": 142.0824, "r_x3": 70.031006, "r_y3": 142.0824, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.231, "r_y0": 150.0177, "r_x1": 286.36548, "r_y1": 150.0177, "r_x2": 286.36548, "r_y2": 142.00171, "r_x3": 195.231, "r_y3": 142.00171, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 160.97668, "r_x1": 120.33251, "r_y1": 160.97668, "r_x2": 120.33251, "r_y2": 152.96069, "r_x3": 70.031006, "r_y3": 152.96069, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1" }, { "label": "list_item", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.112007, "t": 164.28467, "r": 286.36337, "b": 227.0946, "coord_origin": "TOPLEFT" }, "confidence": 0.8580600619316101, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 172.30066, "r_x1": 65.534088, "r_y1": 172.30066, "r_x2": 65.534088, "r_y2": 164.28467, "r_x3": 50.112007, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.84832, "r_y0": 172.30066, "r_x1": 286.35867, "r_y1": 172.30066, "r_x2": 286.35867, "r_y2": 164.28467, "r_x3": 67.84832, "r_y3": 164.28467, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 183.25964, "r_x1": 286.36337, "r_y1": 183.25964, "r_x2": 286.36337, "r_y2": 175.24365, "r_x3": 70.031006, "r_y3": 175.24365, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 194.21862999999996, "r_x1": 286.36334, "r_y1": 194.21862999999996, "r_x2": 286.36334, "r_y2": 186.20263999999997, "r_x3": 70.031006, "r_y3": 186.20263999999997, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 205.17760999999996, "r_x1": 101.33271, "r_y1": 205.17760999999996, "r_x2": 101.33271, "r_y2": 197.16161999999997, "r_x3": 70.031006, "r_y3": 197.16161999999997, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33101, "r_y0": 204.97136999999998, "r_x1": 286.35791, "r_y1": 204.97136999999998, "r_x2": 286.35791, "r_y2": 197.24230999999997, "r_x3": 104.33101, "r_y3": 197.24230999999997, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 215.92938000000004, "r_x1": 220.48719999999997, "r_y1": 215.92938000000004, "r_x2": 220.48719999999997, "r_y2": 208.20032000000003, "r_x3": 70.031006, "r_y3": 208.20032000000003, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48401000000004, "r_y0": 216.13562000000002, "r_x1": 286.36017, "r_y1": 216.13562000000002, "r_x2": 286.36017, "r_y2": 208.11963000000003, "r_x3": 220.48401000000004, "r_y3": 208.11963000000003, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 227.0946, "r_x1": 166.65294, "r_y1": 227.0946, "r_x2": 166.65294, "r_y2": 219.07861000000003, "r_x3": 70.031006, "r_y3": 219.07861000000003, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3" }, { "label": "list_item", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 50.112007, "t": 230.40259000000003, "r": 286.36578, "b": 271.29553, "coord_origin": "TOPLEFT" }, "confidence": 0.8512731194496155, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 238.41858000000002, "r_x1": 65.650383, "r_y1": 238.41858000000002, "r_x2": 65.650383, "r_y2": 230.40259000000003, "r_x3": 50.112007, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.982063, "r_y0": 238.41858000000002, "r_x1": 286.3587, "r_y1": 238.41858000000002, "r_x2": 286.3587, "r_y2": 230.40259000000003, "r_x3": 67.982063, "r_y3": 230.40259000000003, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 249.37756000000002, "r_x1": 147.16895, "r_y1": 249.37756000000002, "r_x2": 147.16895, "r_y2": 241.36157000000003, "r_x3": 70.031006, "r_y3": 241.36157000000003, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93301, "r_y0": 249.17133, "r_x1": 286.36578, "r_y1": 249.17133, "r_x2": 286.36578, "r_y2": 241.44226000000003, "r_x3": 149.93301, "r_y3": 241.44226000000003, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 260.13031, "r_x1": 244.6875, "r_y1": 260.13031, "r_x2": 244.6875, "r_y2": 252.40125, "r_x3": 70.031013, "r_y3": 252.40125, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69101, "r_y0": 260.33655, "r_x1": 286.35791, "r_y1": 260.33655, "r_x2": 286.35791, "r_y2": 252.32056, "r_x3": 244.69101, "r_y3": 252.32056, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 271.29553, "r_x1": 111.36611, "r_y1": 271.29553, "r_x2": 111.36611, "r_y2": 263.27954, "r_x3": 70.031006, "r_y3": 263.27954, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2" }, { "label": "list_item", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.112007, "t": 274.60357999999997, "r": 286.36627, "b": 326.4545, "coord_origin": "TOPLEFT" }, "confidence": 0.8494512438774109, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 282.61951, "r_x1": 66.023834, "r_y1": 282.61951, "r_x2": 66.023834, "r_y2": 274.60357999999997, "r_x3": 50.112007, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.411568, "r_y0": 282.61951, "r_x1": 94.944016, "r_y1": 282.61951, "r_x2": 94.944016, "r_y2": 274.60357999999997, "r_x3": 68.411568, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.8708, "r_y0": 282.61951, "r_x1": 127.26788000000002, "r_y1": 282.61951, "r_x2": 127.26788000000002, "r_y2": 274.60357999999997, "r_x3": 100.8708, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19467, "r_y0": 282.61951, "r_x1": 165.83237, "r_y1": 282.61951, "r_x2": 165.83237, "r_y2": 274.60357999999997, "r_x3": 133.19467, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68269, "r_y0": 282.61951, "r_x1": 194.09445, "r_y1": 282.61951, "r_x2": 194.09445, "r_y2": 274.60357999999997, "r_x3": 172.68269, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02124, "r_y0": 282.61951, "r_x1": 211.4803, "r_y1": 282.61951, "r_x2": 211.4803, "r_y2": 274.60357999999997, "r_x3": 200.02124, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.40708999999998, "r_y0": 282.61951, "r_x1": 239.43755, "r_y1": 282.61951, "r_x2": 239.43755, "r_y2": 274.60357999999997, "r_x3": 217.40708999999998, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.28787000000003, "r_y0": 282.61951, "r_x1": 264.22067, "r_y1": 282.61951, "r_x2": 264.22067, "r_y2": 274.60357999999997, "r_x3": 246.28787000000003, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.14746, "r_y0": 282.61951, "r_x1": 286.35873, "r_y1": 282.61951, "r_x2": 286.35873, "r_y2": 274.60357999999997, "r_x3": 270.14746, "r_y3": 274.60357999999997, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 293.57852, "r_x1": 286.36331, "r_y1": 293.57852, "r_x2": 286.36331, "r_y2": 285.56256, "r_x3": 70.031006, "r_y3": 285.56256, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 304.53751, "r_x1": 286.36331, "r_y1": 304.53751, "r_x2": 286.36331, "r_y2": 296.52155, "r_x3": 70.031006, "r_y3": 296.52155, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 315.49649, "r_x1": 77.500015, "r_y1": 315.49649, "r_x2": 77.500015, "r_y2": 307.48053, "r_x3": 70.031006, "r_y3": 307.48053, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.350006, "r_y0": 315.29028, "r_x1": 286.36627, "r_y1": 315.29028, "r_x2": 286.36627, "r_y2": 307.56122, "r_x3": 79.350006, "r_y3": 307.56122, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 326.24829, "r_x1": 147.57243, "r_y1": 326.24829, "r_x2": 147.57243, "r_y2": 318.51923, "r_x3": 70.031006, "r_y3": 318.51923, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57201, "r_y0": 326.4545, "r_x1": 271.33521, "r_y1": 326.4545, "r_x2": 271.33521, "r_y2": 318.43854, "r_x3": 147.57201, "r_y3": 318.43854, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3" }, { "label": "list_item", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 50.112007, "t": 329.76254, "r": 286.36334, "b": 381.61447, "coord_origin": "TOPLEFT" }, "confidence": 0.8567671179771423, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 337.7785, "r_x1": 65.366135, "r_y1": 337.7785, "r_x2": 65.366135, "r_y2": 329.76254, "r_x3": 50.112007, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.655159, "r_y0": 337.7785, "r_x1": 286.3587, "r_y1": 337.7785, "r_x2": 286.3587, "r_y2": 329.76254, "r_x3": 67.655159, "r_y3": 329.76254, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 348.7375200000001, "r_x1": 286.36334, "r_y1": 348.7375200000001, "r_x2": 286.36334, "r_y2": 340.72156000000007, "r_x3": 70.031006, "r_y3": 340.72156000000007, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 359.6965, "r_x1": 198.82439, "r_y1": 359.6965, "r_x2": 198.82439, "r_y2": 351.68054, "r_x3": 70.031006, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06027, "r_y0": 359.6965, "r_x1": 213.52928, "r_y1": 359.6965, "r_x2": 213.52928, "r_y2": 351.68054, "r_x3": 206.06027, "r_y3": 351.68054, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02101, "r_y0": 359.4903, "r_x1": 286.35815, "r_y1": 359.4903, "r_x2": 286.35815, "r_y2": 351.76123, "r_x3": 217.02101, "r_y3": 351.76123, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 370.44928, "r_x1": 143.08028, "r_y1": 370.44928, "r_x2": 143.08028, "r_y2": 362.72021, "r_x3": 70.031006, "r_y3": 362.72021, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.078, "r_y0": 370.65549000000004, "r_x1": 286.36111, "r_y1": 370.65549000000004, "r_x2": 286.36111, "r_y2": 362.63953000000004, "r_x3": 143.078, "r_y3": 362.63953000000004, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 381.61447, "r_x1": 161.15652, "r_y1": 381.61447, "r_x2": 161.15652, "r_y2": 373.59851, "r_x3": 70.031006, "r_y3": 373.59851, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1" }, { "label": "list_item", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 50.112007, "t": 384.92252, "r": 286.36389, "b": 458.69144, "coord_origin": "TOPLEFT" }, "confidence": 0.8832162618637085, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 392.93848, "r_x1": 65.140724, "r_y1": 392.93848, "r_x2": 65.140724, "r_y2": 384.92252, "r_x3": 50.112007, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.395927, "r_y0": 392.93848, "r_x1": 286.35876, "r_y1": 392.93848, "r_x2": 286.35876, "r_y2": 384.92252, "r_x3": 67.395927, "r_y3": 384.92252, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 403.89749, "r_x1": 286.36337, "r_y1": 403.89749, "r_x2": 286.36337, "r_y2": 395.88153, "r_x3": 70.031006, "r_y3": 395.88153, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 414.85648, "r_x1": 125.47024999999998, "r_y1": 414.85648, "r_x2": 125.47024999999998, "r_y2": 406.84052, "r_x3": 70.031006, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.90764, "r_y0": 414.85648, "r_x1": 230.83444, "r_y1": 414.85648, "r_x2": 230.83444, "r_y2": 406.84052, "r_x3": 133.90764, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27182, "r_y0": 414.85648, "r_x1": 286.36334, "r_y1": 414.85648, "r_x2": 286.36334, "r_y2": 406.84052, "r_x3": 239.27182, "r_y3": 406.84052, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 425.81546, "r_x1": 78.958366, "r_y1": 425.81546, "r_x2": 78.958366, "r_y2": 417.7995, "r_x3": 70.031006, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.254494, "r_y0": 425.81546, "r_x1": 286.36334, "r_y1": 425.81546, "r_x2": 286.36334, "r_y2": 417.7995, "r_x3": 81.254494, "r_y3": 417.7995, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 436.7734699999999, "r_x1": 196.7621, "r_y1": 436.7734699999999, "r_x2": 196.7621, "r_y2": 428.75751, "r_x3": 70.031006, "r_y3": 428.75751, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.20201, "r_y0": 436.56726, "r_x1": 286.36017, "r_y1": 436.56726, "r_x2": 286.36017, "r_y2": 428.8381999999999, "r_x3": 200.20201, "r_y3": 428.8381999999999, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 447.52624999999995, "r_x1": 189.19447, "r_y1": 447.52624999999995, "r_x2": 189.19447, "r_y2": 439.79717999999997, "r_x3": 70.031006, "r_y3": 439.79717999999997, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.19501, "r_y0": 447.73245, "r_x1": 286.36389, "r_y1": 447.73245, "r_x2": 286.36389, "r_y2": 439.71648999999996, "r_x3": 189.19501, "r_y3": 439.71648999999996, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 458.69144, "r_x1": 158.9239, "r_y1": 458.69144, "r_x2": 158.9239, "r_y2": 450.67548, "r_x3": 70.031006, "r_y3": 450.67548, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5" }, { "label": "list_item", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 50.112007, "t": 461.99948, "r": 286.36334, "b": 502.89243, "coord_origin": "TOPLEFT" }, "confidence": 0.8431925177574158, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112007, "r_y0": 470.01544, "r_x1": 65.910469, "r_y1": 470.01544, "r_x2": 65.910469, "r_y2": 461.99948, "r_x3": 50.112007, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.281181, "r_y0": 470.01544, "r_x1": 286.35873, "r_y1": 470.01544, "r_x2": 286.35873, "r_y2": 461.99948, "r_x3": 68.281181, "r_y3": 461.99948, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 480.97446, "r_x1": 116.27969999999999, "r_y1": 480.97446, "r_x2": 116.27969999999999, "r_y2": 472.9585, "r_x3": 70.031006, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48445, "r_y0": 480.97446, "r_x1": 286.36334, "r_y1": 480.97446, "r_x2": 286.36334, "r_y2": 472.9585, "r_x3": 122.48445, "r_y3": 472.9585, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 491.93344, "r_x1": 103.30532, "r_y1": 491.93344, "r_x2": 103.30532, "r_y2": 483.91748, "r_x3": 70.031006, "r_y3": 483.91748, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.51601, "r_y0": 491.72723, "r_x1": 286.35931, "r_y1": 491.72723, "r_x2": 286.35931, "r_y2": 483.99817, "r_x3": 105.51601, "r_y3": 483.99817, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031006, "r_y0": 502.68622, "r_x1": 212.51607, "r_y1": 502.68622, "r_x2": 212.51607, "r_y2": 494.95715, "r_x3": 70.031006, "r_y3": 494.95715, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51401, "r_y0": 502.89243, "r_x1": 263.55975, "r_y1": 502.89243, "r_x2": 263.55975, "r_y2": 494.87646, "r_x3": 212.51401, "r_y3": 494.87646, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2" }, { "label": "list_item", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 50.112015, "t": 506.20047, "r": 286.36337, "b": 547.09244, "coord_origin": "TOPLEFT" }, "confidence": 0.8405635952949524, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 514.21643, "r_x1": 65.682777, "r_y1": 514.21643, "r_x2": 65.682777, "r_y2": 506.20047, "r_x3": 50.112015, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.019325, "r_y0": 514.21643, "r_x1": 247.37280000000004, "r_y1": 514.21643, "r_x2": 247.37280000000004, "r_y2": 506.20047, "r_x3": 68.019325, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97208000000003, "r_y0": 514.21643, "r_x1": 286.3587, "r_y1": 514.21643, "r_x2": 286.3587, "r_y2": 506.20047, "r_x3": 253.97208000000003, "r_y3": 506.20047, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 525.17545, "r_x1": 265.62408, "r_y1": 525.17545, "r_x2": 265.62408, "r_y2": 517.15948, "r_x3": 70.031013, "r_y3": 517.15948, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.42902, "r_y0": 524.96924, "r_x1": 286.36182, "r_y1": 524.96924, "r_x2": 286.36182, "r_y2": 517.24017, "r_x3": 268.42902, "r_y3": 517.24017, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 535.92822, "r_x1": 286.36337, "r_y1": 535.92822, "r_x2": 286.36337, "r_y2": 528.19916, "r_x3": 70.031021, "r_y3": 528.19916, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 546.88622, "r_x1": 125.25507999999999, "r_y1": 546.88622, "r_x2": 125.25507999999999, "r_y2": 539.15718, "r_x3": 70.031021, "r_y3": 539.15718, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25402, "r_y0": 547.09244, "r_x1": 240.05083, "r_y1": 547.09244, "r_x2": 240.05083, "r_y2": 539.07648, "r_x3": 125.25402, "r_y3": 539.07648, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3" }, { "label": "list_item", "id": 11, "page_no": 9, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.112022, "t": 550.40048, "r": 286.36337, "b": 591.29344, "coord_origin": "TOPLEFT" }, "confidence": 0.8241521716117859, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 558.41644, "r_x1": 66.037048, "r_y1": 558.41644, "r_x2": 66.037048, "r_y2": 550.40048, "r_x3": 50.112022, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.426765, "r_y0": 558.41644, "r_x1": 286.3587, "r_y1": 558.41644, "r_x2": 286.3587, "r_y2": 550.40048, "r_x3": 68.426765, "r_y3": 550.40048, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 569.37544, "r_x1": 137.08176, "r_y1": 569.37544, "r_x2": 137.08176, "r_y2": 561.35948, "r_x3": 70.031021, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.9854, "r_y0": 569.37544, "r_x1": 172.38248, "r_y1": 569.37544, "r_x2": 172.38248, "r_y2": 561.35948, "r_x3": 145.9854, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7038, "r_y0": 569.37544, "r_x1": 286.36337, "r_y1": 569.37544, "r_x2": 286.36337, "r_y2": 561.35948, "r_x3": 178.7038, "r_y3": 561.35948, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 580.33444, "r_x1": 221.00723, "r_y1": 580.33444, "r_x2": 221.00723, "r_y2": 572.31848, "r_x3": 70.031021, "r_y3": 572.31848, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54300999999998, "r_y0": 580.12822, "r_x1": 286.35938, "r_y1": 580.12822, "r_x2": 286.35938, "r_y2": 572.39919, "r_x3": 232.54300999999998, "r_y3": 572.39919, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 591.08722, "r_x1": 135.53058, "r_y1": 591.08722, "r_x2": 135.53058, "r_y2": 583.35818, "r_x3": 70.031021, "r_y3": 583.35818, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53003, "r_y0": 591.29344, "r_x1": 167.89876, "r_y1": 591.29344, "r_x2": 167.89876, "r_y2": 583.27748, "r_x3": 135.53003, "r_y3": 583.27748, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3" }, { "label": "list_item", "id": 10, "page_no": 9, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.11203, "t": 594.60149, "r": 286.3634, "b": 635.49445, "coord_origin": "TOPLEFT" }, "confidence": 0.8360886573791504, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11203, "r_y0": 602.61745, "r_x1": 65.23661, "r_y1": 602.61745, "r_x2": 65.23661, "r_y2": 594.60149, "r_x3": 50.11203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.506203, "r_y0": 602.61745, "r_x1": 286.3587, "r_y1": 602.61745, "r_x2": 286.3587, "r_y2": 594.60149, "r_x3": 67.506203, "r_y3": 594.60149, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 613.57645, "r_x1": 109.1066, "r_y1": 613.57645, "r_x2": 109.1066, "r_y2": 605.56049, "r_x3": 70.031029, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.22592, "r_y0": 613.57645, "r_x1": 271.76605, "r_y1": 613.57645, "r_x2": 271.76605, "r_y2": 605.56049, "r_x3": 116.22592, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89435, "r_y0": 613.57645, "r_x1": 286.36337, "r_y1": 613.57645, "r_x2": 286.36337, "r_y2": 605.56049, "r_x3": 278.89435, "r_y3": 605.56049, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 624.32922, "r_x1": 286.3634, "r_y1": 624.32922, "r_x2": 286.3634, "r_y2": 616.60019, "r_x3": 70.031029, "r_y3": 616.60019, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031029, "r_y0": 635.28822, "r_x1": 139.09921, "r_y1": 635.28822, "r_x2": 139.09921, "r_y2": 627.55919, "r_x3": 70.031029, "r_y3": 627.55919, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.09802, "r_y0": 635.49445, "r_x1": 238.95683, "r_y1": 635.49445, "r_x2": 238.95683, "r_y2": 627.47849, "r_x3": 139.09802, "r_y3": 627.47849, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4" }, { "label": "list_item", "id": 12, "page_no": 9, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 50.112022, "t": 638.80249, "r": 286.36337, "b": 690.65347, "coord_origin": "TOPLEFT" }, "confidence": 0.8079474568367004, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112022, "r_y0": 646.81845, "r_x1": 65.203552, "r_y1": 646.81845, "r_x2": 65.203552, "r_y2": 638.80249, "r_x3": 50.112022, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.468193, "r_y0": 646.81845, "r_x1": 286.35873, "r_y1": 646.81845, "r_x2": 286.35873, "r_y2": 638.80249, "r_x3": 67.468193, "r_y3": 638.80249, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 657.77646, "r_x1": 286.36337, "r_y1": 657.77646, "r_x2": 286.36337, "r_y2": 649.7605, "r_x3": 70.031021, "r_y3": 649.7605, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 668.73547, "r_x1": 286.36334, "r_y1": 668.73547, "r_x2": 286.36334, "r_y2": 660.7195, "r_x3": 70.031021, "r_y3": 660.7195, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031021, "r_y0": 679.69447, "r_x1": 158.45766, "r_y1": 679.69447, "r_x2": 158.45766, "r_y2": 671.6785, "r_x3": 70.031021, "r_y3": 671.6785, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.52802, "r_y0": 679.48824, "r_x1": 286.36249, "r_y1": 679.48824, "r_x2": 286.36249, "r_y2": 671.7592, "r_x3": 160.52802, "r_y3": 671.7592, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 690.44724, "r_x1": 171.42305, "r_y1": 690.44724, "r_x2": 171.42305, "r_y2": 682.7182, "r_x3": 70.031013, "r_y3": 682.7182, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42201, "r_y0": 690.65347, "r_x1": 212.75713, "r_y1": 690.65347, "r_x2": 212.75713, "r_y2": 682.6375, "r_x3": 171.42201, "r_y3": 682.6375, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 9, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.112015, "t": 693.961502, "r": 286.36334, "b": 712.936462, "coord_origin": "TOPLEFT" }, "confidence": 0.8385783433914185, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112015, "r_y0": 701.977463, "r_x1": 66.506706, "r_y1": 701.977463, "r_x2": 66.506706, "r_y2": 693.961502, "r_x3": 50.112015, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.966896, "r_y0": 701.977463, "r_x1": 80.992294, "r_y1": 701.977463, "r_x2": 80.992294, "r_y2": 693.961502, "r_x3": 68.966896, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.062057, "r_y0": 701.977463, "r_x1": 114.71492999999998, "r_y1": 701.977463, "r_x2": 114.71492999999998, "r_y2": 693.961502, "r_x3": 89.062057, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.24621000000002, "r_y0": 701.977463, "r_x1": 149.1459, "r_y1": 701.977463, "r_x2": 149.1459, "r_y2": 693.961502, "r_x3": 124.24621000000002, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22462, "r_y0": 701.977463, "r_x1": 209.37321, "r_y1": 701.977463, "r_x2": 209.37321, "r_y2": 693.961502, "r_x3": 157.22462, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9045, "r_y0": 701.977463, "r_x1": 231.85196999999997, "r_y1": 701.977463, "r_x2": 231.85196999999997, "r_y2": 693.961502, "r_x3": 218.9045, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93069, "r_y0": 701.977463, "r_x1": 269.32254, "r_y1": 701.977463, "r_x2": 269.32254, "r_y2": 693.961502, "r_x3": 239.93069, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.3923, "r_y0": 701.977463, "r_x1": 286.3587, "r_y1": 701.977463, "r_x2": 286.3587, "r_y2": 693.961502, "r_x3": 277.3923, "r_y3": 693.961502, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.031013, "r_y0": 712.936462, "r_x1": 286.36334, "r_y1": 712.936462, "r_x2": 286.36334, "r_y2": 704.920502, "r_x3": 70.031013, "r_y3": 704.920502, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model," }, { "label": "list_item", "id": 14, "page_no": 9, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 328.78101, "t": 75.88347999999996, "r": 545.11456, "b": 116.77544999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.7556979060173035, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 83.89948000000015, "r_x1": 545.11346, "r_y1": 83.89948000000015, "r_x2": 545.11346, "r_y2": 75.88347999999996, "r_x3": 328.78101, "r_y3": 75.88347999999996, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 94.85748000000001, "r_x1": 472.30618, "r_y1": 94.85748000000001, "r_x2": 472.30618, "r_y2": 86.84149000000002, "r_x3": 328.78101, "r_y3": 86.84149000000002, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.88501, "r_y0": 94.65125, "r_x1": 545.11456, "r_y1": 94.65125, "r_x2": 545.11456, "r_y2": 86.92218000000003, "r_x3": 475.88501, "r_y3": 86.92218000000003, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 105.61023, "r_x1": 371.92734, "r_y1": 105.61023, "r_x2": 371.92734, "r_y2": 97.88116000000002, "r_x3": 328.78101, "r_y3": 97.88116000000002, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.92599, "r_y0": 105.81646999999987, "r_x1": 545.11206, "r_y1": 105.81646999999987, "r_x2": 545.11206, "r_y2": 97.80048, "r_x3": 371.92599, "r_y3": 97.80048, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 116.77544999999998, "r_x1": 417.70087, "r_y1": 116.77544999999998, "r_x2": 417.70087, "r_y2": 108.75945999999999, "r_x3": 328.78101, "r_y3": 108.75945999999999, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7" }, { "label": "list_item", "id": 9, "page_no": 9, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 120.71447999999998, "r": 545.11334, "b": 161.60742000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.8375797271728516, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 128.73046999999997, "r_x1": 324.33197, "r_y1": 128.73046999999997, "r_x2": 324.33197, "r_y2": 120.71447999999998, "r_x3": 308.862, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65341, "r_y0": 128.73046999999997, "r_x1": 545.10876, "r_y1": 128.73046999999997, "r_x2": 545.10876, "r_y2": 120.71447999999998, "r_x3": 326.65341, "r_y3": 120.71447999999998, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 139.68944999999997, "r_x1": 545.11334, "r_y1": 139.68944999999997, "r_x2": 545.11334, "r_y2": 131.67345999999998, "r_x3": 328.78101, "r_y3": 131.67345999999998, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 150.44219999999996, "r_x1": 545.11328, "r_y1": 150.44219999999996, "r_x2": 545.11328, "r_y2": 142.71312999999998, "r_x3": 328.78101, "r_y3": 142.71312999999998, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78101, "r_y0": 161.40117999999995, "r_x1": 406.32245, "r_y1": 161.40117999999995, "r_x2": 406.32245, "r_y2": 153.67211999999995, "r_x3": 328.78101, "r_y3": 153.67211999999995, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32202, "r_y0": 161.60742000000005, "r_x1": 506.18085, "r_y1": 161.60742000000005, "r_x2": 506.18085, "r_y2": 153.59142999999995, "r_x3": 406.32202, "r_y3": 153.59142999999995, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1" } ], "headers": [ { "label": "page_footer", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.1329920000001, "r": 302.59259, "b": 743.039555, "coord_origin": "TOPLEFT" }, "confidence": 0.9069584012031555, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.039555, "r_x1": 302.59259, "r_y1": 743.039555, "r_x2": 302.59259, "r_y2": 734.1329920000001, "r_x3": 292.63, "r_y3": 734.1329920000001, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" } ] } }, { "page_no": 10, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.842, "r_y0": 121.32263, "r_x1": 465.37591999999995, "r_y1": 121.32263, "r_x2": 465.37591999999995, "r_y2": 110.57488999999998, "r_x3": 132.842, "r_y3": 110.57488999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18399, "r_y0": 135.53008999999997, "r_x1": 375.04269, "r_y1": 135.53008999999997, "r_x2": 375.04269, "r_y2": 122.25982999999997, "r_x3": 220.18399, "r_y3": 122.25982999999997, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 171.90863000000002, "r_x1": 57.089828, "r_y1": 171.90863000000002, "r_x2": 57.089828, "r_y2": 161.16089, "r_x3": 50.111984, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.393616, "r_y0": 171.90863000000002, "r_x1": 175.96437, "r_y1": 171.90863000000002, "r_x2": 175.96437, "r_y2": 161.16089, "r_x3": 66.393616, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 190.83136000000002, "r_x1": 64.210808, "r_y1": 190.83136000000002, "r_x2": 64.210808, "r_y2": 180.97931000000005, "r_x3": 50.111984, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.610023, "r_y0": 190.83136000000002, "r_x1": 150.36401, "r_y1": 190.83136000000002, "r_x2": 150.36401, "r_y2": 180.97931000000005, "r_x3": 73.610023, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 208.82683999999995, "r_x1": 286.36496, "r_y1": 208.82683999999995, "r_x2": 286.36496, "r_y2": 199.92029000000002, "r_x3": 62.06698600000001, "r_y3": 199.92029000000002, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 220.78283999999996, "r_x1": 286.36505, "r_y1": 220.78283999999996, "r_x2": 286.36505, "r_y2": 211.87627999999995, "r_x3": 50.111984, "r_y3": 211.87627999999995, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 232.73784999999998, "r_x1": 286.36514, "r_y1": 232.73784999999998, "r_x2": 286.36514, "r_y2": 223.83130000000006, "r_x3": 50.111984, "r_y3": 223.83130000000006, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 244.69286999999997, "r_x1": 286.36508, "r_y1": 244.69286999999997, "r_x2": 286.36508, "r_y2": 235.78632000000005, "r_x3": 50.111984, "r_y3": 235.78632000000005, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 256.64788999999996, "r_x1": 286.36505, "r_y1": 256.64788999999996, "r_x2": 286.36505, "r_y2": 247.74132999999995, "r_x3": 50.111984, "r_y3": 247.74132999999995, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 268.60290999999995, "r_x1": 286.36505, "r_y1": 268.60290999999995, "r_x2": 286.36505, "r_y2": 259.69635000000005, "r_x3": 50.111984, "r_y3": 259.69635000000005, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 280.55792, "r_x1": 286.36505, "r_y1": 280.55792, "r_x2": 286.36505, "r_y2": 271.65137000000004, "r_x3": 50.111984, "r_y3": 271.65137000000004, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 292.5139199999999, "r_x1": 286.36502, "r_y1": 292.5139199999999, "r_x2": 286.36502, "r_y2": 283.60736, "r_x3": 50.111984, "r_y3": 283.60736, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 304.4689, "r_x1": 286.36505, "r_y1": 304.4689, "r_x2": 286.36505, "r_y2": 295.56235, "r_x3": 50.111984, "r_y3": 295.56235, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 316.42389, "r_x1": 286.36508, "r_y1": 316.42389, "r_x2": 286.36508, "r_y2": 307.5173300000001, "r_x3": 50.111984, "r_y3": 307.5173300000001, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 328.3788799999999, "r_x1": 286.36505, "r_y1": 328.3788799999999, "r_x2": 286.36505, "r_y2": 319.47232, "r_x3": 50.111984, "r_y3": 319.47232, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 340.33386, "r_x1": 286.36502, "r_y1": 340.33386, "r_x2": 286.36502, "r_y2": 331.42731000000003, "r_x3": 50.111984, "r_y3": 331.42731000000003, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 352.28986, "r_x1": 286.36508, "r_y1": 352.28986, "r_x2": 286.36508, "r_y2": 343.3833, "r_x3": 50.111984, "r_y3": 343.3833, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 364.24484000000007, "r_x1": 286.36505, "r_y1": 364.24484000000007, "r_x2": 286.36505, "r_y2": 355.33829, "r_x3": 50.111984, "r_y3": 355.33829, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 376.19983, "r_x1": 286.36508, "r_y1": 376.19983, "r_x2": 286.36508, "r_y2": 367.29327, "r_x3": 50.111984, "r_y3": 367.29327, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 388.15482000000003, "r_x1": 230.80364999999998, "r_y1": 388.15482000000003, "r_x2": 230.80364999999998, "r_y2": 379.24826, "r_x3": 50.111984, "r_y3": 379.24826, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 400.31183, "r_x1": 286.36499, "r_y1": 400.31183, "r_x2": 286.36499, "r_y2": 391.40527, "r_x3": 62.06698600000001, "r_y3": 391.40527, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 412.26681999999994, "r_x1": 286.36508, "r_y1": 412.26681999999994, "r_x2": 286.36508, "r_y2": 403.36026, "r_x3": 50.111984, "r_y3": 403.36026, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 424.22180000000003, "r_x1": 286.36505, "r_y1": 424.22180000000003, "r_x2": 286.36505, "r_y2": 415.31525, "r_x3": 50.111984, "r_y3": 415.31525, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 436.1778, "r_x1": 286.36505, "r_y1": 436.1778, "r_x2": 286.36505, "r_y2": 427.2712399999999, "r_x3": 50.111984, "r_y3": 427.2712399999999, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 448.1327800000001, "r_x1": 286.36508, "r_y1": 448.1327800000001, "r_x2": 286.36508, "r_y2": 439.22623, "r_x3": 50.111984, "r_y3": 439.22623, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 460.08777, "r_x1": 286.36511, "r_y1": 460.08777, "r_x2": 286.36511, "r_y2": 451.18121, "r_x3": 50.111984, "r_y3": 451.18121, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 472.04276, "r_x1": 286.36505, "r_y1": 472.04276, "r_x2": 286.36505, "r_y2": 463.1362, "r_x3": 50.111984, "r_y3": 463.1362, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 483.99774, "r_x1": 286.36508, "r_y1": 483.99774, "r_x2": 286.36508, "r_y2": 475.09119, "r_x3": 50.111984, "r_y3": 475.09119, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 495.95273, "r_x1": 286.36502, "r_y1": 495.95273, "r_x2": 286.36502, "r_y2": 487.04617, "r_x3": 50.111984, "r_y3": 487.04617, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 507.90872, "r_x1": 286.36511, "r_y1": 507.90872, "r_x2": 286.36511, "r_y2": 499.00217, "r_x3": 50.111984, "r_y3": 499.00217, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 519.8637100000001, "r_x1": 286.36508, "r_y1": 519.8637100000001, "r_x2": 286.36508, "r_y2": 510.95715, "r_x3": 50.111984, "r_y3": 510.95715, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 531.8187, "r_x1": 286.36508, "r_y1": 531.8187, "r_x2": 286.36508, "r_y2": 522.91214, "r_x3": 50.111984, "r_y3": 522.91214, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 543.7737, "r_x1": 286.36505, "r_y1": 543.7737, "r_x2": 286.36505, "r_y2": 534.86713, "r_x3": 50.111984, "r_y3": 534.86713, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 555.7287, "r_x1": 286.36502, "r_y1": 555.7287, "r_x2": 286.36502, "r_y2": 546.82214, "r_x3": 50.111984, "r_y3": 546.82214, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 567.68469, "r_x1": 257.47351, "r_y1": 567.68469, "r_x2": 257.47351, "r_y2": 558.77814, "r_x3": 50.111984, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.94919, "r_y0": 567.68469, "r_x1": 286.36505, "r_y1": 567.68469, "r_x2": 286.36505, "r_y2": 558.77814, "r_x3": 263.94919, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 579.63969, "r_x1": 286.36508, "r_y1": 579.63969, "r_x2": 286.36508, "r_y2": 570.73314, "r_x3": 50.111984, "r_y3": 570.73314, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 591.5947, "r_x1": 286.36511, "r_y1": 591.5947, "r_x2": 286.36511, "r_y2": 582.68814, "r_x3": 50.111984, "r_y3": 582.68814, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 603.5497, "r_x1": 286.36511, "r_y1": 603.5497, "r_x2": 286.36511, "r_y2": 594.64314, "r_x3": 50.111984, "r_y3": 594.64314, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 615.5047, "r_x1": 286.36505, "r_y1": 615.5047, "r_x2": 286.36505, "r_y2": 606.5981400000001, "r_x3": 50.111984, "r_y3": 606.5981400000001, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 627.4597, "r_x1": 242.2606, "r_y1": 627.4597, "r_x2": 242.2606, "r_y2": 618.55315, "r_x3": 50.111984, "r_y3": 618.55315, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 639.6167, "r_x1": 286.36496, "r_y1": 639.6167, "r_x2": 286.36496, "r_y2": 630.71014, "r_x3": 62.06698600000001, "r_y3": 630.71014, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 651.57269, "r_x1": 179.90472, "r_y1": 651.57269, "r_x2": 179.90472, "r_y2": 642.66614, "r_x3": 50.111984, "r_y3": 642.66614, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 672.24219, "r_x1": 64.297272, "r_y1": 672.24219, "r_x2": 64.297272, "r_y2": 662.39014, "r_x3": 50.111984, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.754135, "r_y0": 672.24219, "r_x1": 153.60785, "r_y1": 672.24219, "r_x2": 153.60785, "r_y2": 662.39014, "r_x3": 73.754135, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 690.2377, "r_x1": 286.36493, "r_y1": 690.2377, "r_x2": 286.36493, "r_y2": 681.33113, "r_x3": 62.06698600000001, "r_y3": 681.33113, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 702.1927029999999, "r_x1": 286.36505, "r_y1": 702.1927029999999, "r_x2": 286.36505, "r_y2": 693.2861330000001, "r_x3": 50.111984, "r_y3": 693.2861330000001, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 714.147705, "r_x1": 84.144226, "r_y1": 714.147705, "r_x2": 84.144226, "r_y2": 705.241135, "r_x3": 50.111984, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.237595, "r_y0": 714.147705, "r_x1": 286.36505, "r_y1": 714.147705, "r_x2": 286.36505, "r_y2": 705.241135, "r_x3": 91.237595, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 171.56170999999995, "r_x1": 545.11511, "r_y1": 171.56170999999995, "r_x2": 545.11511, "r_y2": 162.65515000000005, "r_x3": 308.862, "r_y3": 162.65515000000005, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.51671999999996, "r_x1": 545.11511, "r_y1": 183.51671999999996, "r_x2": 545.11511, "r_y2": 174.61017000000004, "r_x3": 308.862, "r_y3": 174.61017000000004, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 195.47173999999995, "r_x1": 545.11511, "r_y1": 195.47173999999995, "r_x2": 545.11511, "r_y2": 186.56519000000003, "r_x3": 308.862, "r_y3": 186.56519000000003, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 207.42773, "r_x1": 484.07434, "r_y1": 207.42773, "r_x2": 484.07434, "r_y2": 198.52117999999996, "r_x3": 308.862, "r_y3": 198.52117999999996, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 220.14171999999996, "r_x1": 545.11505, "r_y1": 220.14171999999996, "r_x2": 545.11505, "r_y2": 211.23517000000004, "r_x3": 320.81699, "r_y3": 211.23517000000004, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 232.09673999999995, "r_x1": 448.08939, "r_y1": 232.09673999999995, "r_x2": 448.08939, "r_y2": 223.19019000000003, "r_x3": 308.862, "r_y3": 223.19019000000003, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 244.81177000000002, "r_x1": 328.28894, "r_y1": 244.81177000000002, "r_x2": 328.28894, "r_y2": 235.90521, "r_x3": 320.81699, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38232, "r_y0": 244.81177000000002, "r_x1": 545.11499, "r_y1": 244.81177000000002, "r_x2": 545.11499, "r_y2": 235.90521, "r_x3": 335.38232, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 256.76678000000004, "r_x1": 545.11511, "r_y1": 256.76678000000004, "r_x2": 545.11511, "r_y2": 247.86023, "r_x3": 308.862, "r_y3": 247.86023, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 268.72180000000003, "r_x1": 545.11511, "r_y1": 268.72180000000003, "r_x2": 545.11511, "r_y2": 259.81525, "r_x3": 308.862, "r_y3": 259.81525, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 280.67682, "r_x1": 393.3847, "r_y1": 280.67682, "r_x2": 393.3847, "r_y2": 271.77026, "r_x3": 308.862, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.11942, "r_y0": 280.67682, "r_x1": 545.11511, "r_y1": 280.67682, "r_x2": 545.11511, "r_y2": 271.77026, "r_x3": 400.11942, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 292.63181, "r_x1": 545.11505, "r_y1": 292.63181, "r_x2": 545.11505, "r_y2": 283.72524999999996, "r_x3": 308.862, "r_y3": 283.72524999999996, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 304.5878000000001, "r_x1": 545.11511, "r_y1": 304.5878000000001, "r_x2": 545.11511, "r_y2": 295.68124, "r_x3": 308.862, "r_y3": 295.68124, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 316.54279, "r_x1": 425.69348, "r_y1": 316.54279, "r_x2": 425.69348, "r_y2": 307.63623, "r_x3": 308.862, "r_y3": 307.63623, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 329.25677, "r_x1": 328.4949, "r_y1": 329.25677, "r_x2": 328.4949, "r_y2": 320.35022, "r_x3": 320.81699, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05423, "r_y0": 329.25677, "r_x1": 545.11499, "r_y1": 329.25677, "r_x2": 545.11499, "r_y2": 320.35022, "r_x3": 331.05423, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 341.21176, "r_x1": 545.11517, "r_y1": 341.21176, "r_x2": 545.11517, "r_y2": 332.30521000000005, "r_x3": 308.862, "r_y3": 332.30521000000005, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 353.16675, "r_x1": 545.11505, "r_y1": 353.16675, "r_x2": 545.11505, "r_y2": 344.26018999999997, "r_x3": 308.862, "r_y3": 344.26018999999997, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 365.12273999999996, "r_x1": 545.11511, "r_y1": 365.12273999999996, "r_x2": 545.11511, "r_y2": 356.21619, "r_x3": 308.862, "r_y3": 356.21619, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 377.07773, "r_x1": 545.11511, "r_y1": 377.07773, "r_x2": 545.11511, "r_y2": 368.17117, "r_x3": 308.862, "r_y3": 368.17117, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 389.03271, "r_x1": 545.11499, "r_y1": 389.03271, "r_x2": 545.11499, "r_y2": 380.12616, "r_x3": 308.862, "r_y3": 380.12616, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.98769999999996, "r_x1": 545.11517, "r_y1": 400.98769999999996, "r_x2": 545.11517, "r_y2": 392.08115, "r_x3": 308.862, "r_y3": 392.08115, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.94269, "r_x1": 545.11511, "r_y1": 412.94269, "r_x2": 545.11511, "r_y2": 404.03613000000007, "r_x3": 308.862, "r_y3": 404.03613000000007, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.89767, "r_x1": 545.11499, "r_y1": 424.89767, "r_x2": 545.11499, "r_y2": 415.99112, "r_x3": 308.862, "r_y3": 415.99112, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.85367, "r_x1": 545.11517, "r_y1": 436.85367, "r_x2": 545.11517, "r_y2": 427.94711, "r_x3": 308.862, "r_y3": 427.94711, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.80865, "r_x1": 345.94278, "r_y1": 448.80865, "r_x2": 345.94278, "r_y2": 439.9021, "r_x3": 308.862, "r_y3": 439.9021, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 461.52264, "r_x1": 328.30341, "r_y1": 461.52264, "r_x2": 328.30341, "r_y2": 452.61609, "r_x3": 320.81699, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.79889, "r_y0": 461.52264, "r_x1": 485.75772000000006, "r_y1": 461.52264, "r_x2": 485.75772000000006, "r_y2": 452.61609, "r_x3": 330.79889, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.073, "r_y0": 461.29352, "r_x1": 511.86368, "r_y1": 461.29352, "r_x2": 511.86368, "r_y2": 452.70575, "r_x3": 488.073, "r_y3": 452.70575, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86301, "r_y0": 461.52264, "r_x1": 545.10815, "r_y1": 461.52264, "r_x2": 545.10815, "r_y2": 452.61609, "r_x3": 511.86301, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 473.47763, "r_x1": 545.11505, "r_y1": 473.47763, "r_x2": 545.11505, "r_y2": 464.57108, "r_x3": 308.862, "r_y3": 464.57108, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 485.43362, "r_x1": 545.11517, "r_y1": 485.43362, "r_x2": 545.11517, "r_y2": 476.52707, "r_x3": 308.862, "r_y3": 476.52707, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.38861, "r_x1": 379.14816, "r_y1": 497.38861, "r_x2": 379.14816, "r_y2": 488.48206, "r_x3": 308.862, "r_y3": 488.48206, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 510.1026, "r_x1": 328.66177, "r_y1": 510.1026, "r_x2": 328.66177, "r_y2": 501.19604, "r_x3": 320.81699, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2767, "r_y0": 510.1026, "r_x1": 545.11493, "r_y1": 510.1026, "r_x2": 545.11493, "r_y2": 501.19604, "r_x3": 331.2767, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 522.05759, "r_x1": 545.1153, "r_y1": 522.05759, "r_x2": 545.1153, "r_y2": 513.15103, "r_x3": 308.862, "r_y3": 513.15103, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 534.01358, "r_x1": 384.29883, "r_y1": 534.01358, "r_x2": 384.29883, "r_y2": 525.10703, "r_x3": 308.862, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25272, "r_y0": 534.01358, "r_x1": 545.11511, "r_y1": 534.01358, "r_x2": 545.11511, "r_y2": 525.10703, "r_x3": 391.25272, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.96858, "r_x1": 496.15897000000007, "r_y1": 545.96858, "r_x2": 496.15897000000007, "r_y2": 537.06203, "r_x3": 308.862, "r_y3": 537.06203, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 558.68259, "r_x1": 328.28894, "r_y1": 558.68259, "r_x2": 328.28894, "r_y2": 549.77603, "r_x3": 320.81699, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.40222, "r_y0": 558.68259, "r_x1": 545.11499, "r_y1": 558.68259, "r_x2": 545.11499, "r_y2": 549.77603, "r_x3": 335.40222, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 570.63759, "r_x1": 545.11517, "r_y1": 570.63759, "r_x2": 545.11517, "r_y2": 561.73103, "r_x3": 308.862, "r_y3": 561.73103, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 582.59259, "r_x1": 545.11511, "r_y1": 582.59259, "r_x2": 545.11511, "r_y2": 573.68604, "r_x3": 308.862, "r_y3": 573.68604, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 594.54858, "r_x1": 545.11505, "r_y1": 594.54858, "r_x2": 545.11505, "r_y2": 585.64203, "r_x3": 308.862, "r_y3": 585.64203, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 606.50359, "r_x1": 341.2305, "r_y1": 606.50359, "r_x2": 341.2305, "r_y2": 597.59703, "r_x3": 308.862, "r_y3": 597.59703, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 633.03831, "r_x1": 316.76675, "r_y1": 633.03831, "r_x2": 316.76675, "r_y2": 622.2905900000001, "r_x3": 308.862, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.30643, "r_y0": 633.03831, "r_x1": 545.10876, "r_y1": 633.03831, "r_x2": 545.10876, "r_y2": 622.2905900000001, "r_x3": 327.30643, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 646.98631, "r_x1": 357.34055, "r_y1": 646.98631, "r_x2": 357.34055, "r_y2": 636.2385899999999, "r_x3": 326.79501, "r_y3": 636.2385899999999, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 666.3276, "r_x1": 545.11499, "r_y1": 666.3276, "r_x2": 545.11499, "r_y2": 657.42104, "r_x3": 320.81702, "r_y3": 657.42104, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 678.2826, "r_x1": 545.11511, "r_y1": 678.2826, "r_x2": 545.11511, "r_y2": 669.37604, "r_x3": 308.86203, "r_y3": 669.37604, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 690.2376, "r_x1": 545.11517, "r_y1": 690.2376, "r_x2": 545.11517, "r_y2": 681.33104, "r_x3": 308.86203, "r_y3": 681.33104, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 702.1926040000001, "r_x1": 545.11505, "r_y1": 702.1926040000001, "r_x2": 545.11505, "r_y2": 693.286041, "r_x3": 308.86203, "r_y3": 693.286041, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 714.148605, "r_x1": 371.42719, "r_y1": 714.148605, "r_x2": 371.42719, "r_y2": 705.242035, "r_x3": 308.86203, "r_y3": 705.242035, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63104, "r_y0": 743.0396, "r_x1": 302.59363, "r_y1": 743.0396, "r_x2": 302.59363, "r_y2": 734.1330379999999, "r_x3": 292.63104, "r_y3": 734.1330379999999, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 18, "label": "section_header", "bbox": { "l": 132.842, "t": 110.57488999999998, "r": 465.37591999999995, "b": 135.53008999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.6497084498405457, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.842, "r_y0": 121.32263, "r_x1": 465.37591999999995, "r_y1": 121.32263, "r_x2": 465.37591999999995, "r_y2": 110.57488999999998, "r_x3": 132.842, "r_y3": 110.57488999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18399, "r_y0": 135.53008999999997, "r_x1": 375.04269, "r_y1": 135.53008999999997, "r_x2": 375.04269, "r_y2": 122.25982999999997, "r_x3": 220.18399, "r_y3": 122.25982999999997, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 50.111984, "t": 161.16089, "r": 175.96437, "b": 171.90863000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9454860091209412, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 171.90863000000002, "r_x1": 57.089828, "r_y1": 171.90863000000002, "r_x2": 57.089828, "r_y2": 161.16089, "r_x3": 50.111984, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.393616, "r_y0": 171.90863000000002, "r_x1": 175.96437, "r_y1": 171.90863000000002, "r_x2": 175.96437, "r_y2": 161.16089, "r_x3": 66.393616, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "section_header", "bbox": { "l": 50.111984, "t": 180.97931000000005, "r": 150.36401, "b": 190.83136000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9535645842552185, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 190.83136000000002, "r_x1": 64.210808, "r_y1": 190.83136000000002, "r_x2": 64.210808, "r_y2": 180.97931000000005, "r_x3": 50.111984, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.610023, "r_y0": 190.83136000000002, "r_x1": 150.36401, "r_y1": 190.83136000000002, "r_x2": 150.36401, "r_y2": 180.97931000000005, "r_x3": 73.610023, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 50.111984, "t": 199.92029000000002, "r": 286.36514, "b": 388.15482000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9864971041679382, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 208.82683999999995, "r_x1": 286.36496, "r_y1": 208.82683999999995, "r_x2": 286.36496, "r_y2": 199.92029000000002, "r_x3": 62.06698600000001, "r_y3": 199.92029000000002, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 220.78283999999996, "r_x1": 286.36505, "r_y1": 220.78283999999996, "r_x2": 286.36505, "r_y2": 211.87627999999995, "r_x3": 50.111984, "r_y3": 211.87627999999995, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 232.73784999999998, "r_x1": 286.36514, "r_y1": 232.73784999999998, "r_x2": 286.36514, "r_y2": 223.83130000000006, "r_x3": 50.111984, "r_y3": 223.83130000000006, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 244.69286999999997, "r_x1": 286.36508, "r_y1": 244.69286999999997, "r_x2": 286.36508, "r_y2": 235.78632000000005, "r_x3": 50.111984, "r_y3": 235.78632000000005, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 256.64788999999996, "r_x1": 286.36505, "r_y1": 256.64788999999996, "r_x2": 286.36505, "r_y2": 247.74132999999995, "r_x3": 50.111984, "r_y3": 247.74132999999995, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 268.60290999999995, "r_x1": 286.36505, "r_y1": 268.60290999999995, "r_x2": 286.36505, "r_y2": 259.69635000000005, "r_x3": 50.111984, "r_y3": 259.69635000000005, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 280.55792, "r_x1": 286.36505, "r_y1": 280.55792, "r_x2": 286.36505, "r_y2": 271.65137000000004, "r_x3": 50.111984, "r_y3": 271.65137000000004, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 292.5139199999999, "r_x1": 286.36502, "r_y1": 292.5139199999999, "r_x2": 286.36502, "r_y2": 283.60736, "r_x3": 50.111984, "r_y3": 283.60736, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 304.4689, "r_x1": 286.36505, "r_y1": 304.4689, "r_x2": 286.36505, "r_y2": 295.56235, "r_x3": 50.111984, "r_y3": 295.56235, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 316.42389, "r_x1": 286.36508, "r_y1": 316.42389, "r_x2": 286.36508, "r_y2": 307.5173300000001, "r_x3": 50.111984, "r_y3": 307.5173300000001, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 328.3788799999999, "r_x1": 286.36505, "r_y1": 328.3788799999999, "r_x2": 286.36505, "r_y2": 319.47232, "r_x3": 50.111984, "r_y3": 319.47232, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 340.33386, "r_x1": 286.36502, "r_y1": 340.33386, "r_x2": 286.36502, "r_y2": 331.42731000000003, "r_x3": 50.111984, "r_y3": 331.42731000000003, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 352.28986, "r_x1": 286.36508, "r_y1": 352.28986, "r_x2": 286.36508, "r_y2": 343.3833, "r_x3": 50.111984, "r_y3": 343.3833, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 364.24484000000007, "r_x1": 286.36505, "r_y1": 364.24484000000007, "r_x2": 286.36505, "r_y2": 355.33829, "r_x3": 50.111984, "r_y3": 355.33829, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 376.19983, "r_x1": 286.36508, "r_y1": 376.19983, "r_x2": 286.36508, "r_y2": 367.29327, "r_x3": 50.111984, "r_y3": 367.29327, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 388.15482000000003, "r_x1": 230.80364999999998, "r_y1": 388.15482000000003, "r_x2": 230.80364999999998, "r_y2": 379.24826, "r_x3": 50.111984, "r_y3": 379.24826, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.111984, "t": 391.40527, "r": 286.36511, "b": 627.4597, "coord_origin": "TOPLEFT" }, "confidence": 0.9826022386550903, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 400.31183, "r_x1": 286.36499, "r_y1": 400.31183, "r_x2": 286.36499, "r_y2": 391.40527, "r_x3": 62.06698600000001, "r_y3": 391.40527, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 412.26681999999994, "r_x1": 286.36508, "r_y1": 412.26681999999994, "r_x2": 286.36508, "r_y2": 403.36026, "r_x3": 50.111984, "r_y3": 403.36026, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 424.22180000000003, "r_x1": 286.36505, "r_y1": 424.22180000000003, "r_x2": 286.36505, "r_y2": 415.31525, "r_x3": 50.111984, "r_y3": 415.31525, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 436.1778, "r_x1": 286.36505, "r_y1": 436.1778, "r_x2": 286.36505, "r_y2": 427.2712399999999, "r_x3": 50.111984, "r_y3": 427.2712399999999, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 448.1327800000001, "r_x1": 286.36508, "r_y1": 448.1327800000001, "r_x2": 286.36508, "r_y2": 439.22623, "r_x3": 50.111984, "r_y3": 439.22623, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 460.08777, "r_x1": 286.36511, "r_y1": 460.08777, "r_x2": 286.36511, "r_y2": 451.18121, "r_x3": 50.111984, "r_y3": 451.18121, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 472.04276, "r_x1": 286.36505, "r_y1": 472.04276, "r_x2": 286.36505, "r_y2": 463.1362, "r_x3": 50.111984, "r_y3": 463.1362, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 483.99774, "r_x1": 286.36508, "r_y1": 483.99774, "r_x2": 286.36508, "r_y2": 475.09119, "r_x3": 50.111984, "r_y3": 475.09119, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 495.95273, "r_x1": 286.36502, "r_y1": 495.95273, "r_x2": 286.36502, "r_y2": 487.04617, "r_x3": 50.111984, "r_y3": 487.04617, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 507.90872, "r_x1": 286.36511, "r_y1": 507.90872, "r_x2": 286.36511, "r_y2": 499.00217, "r_x3": 50.111984, "r_y3": 499.00217, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 519.8637100000001, "r_x1": 286.36508, "r_y1": 519.8637100000001, "r_x2": 286.36508, "r_y2": 510.95715, "r_x3": 50.111984, "r_y3": 510.95715, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 531.8187, "r_x1": 286.36508, "r_y1": 531.8187, "r_x2": 286.36508, "r_y2": 522.91214, "r_x3": 50.111984, "r_y3": 522.91214, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 543.7737, "r_x1": 286.36505, "r_y1": 543.7737, "r_x2": 286.36505, "r_y2": 534.86713, "r_x3": 50.111984, "r_y3": 534.86713, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 555.7287, "r_x1": 286.36502, "r_y1": 555.7287, "r_x2": 286.36502, "r_y2": 546.82214, "r_x3": 50.111984, "r_y3": 546.82214, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 567.68469, "r_x1": 257.47351, "r_y1": 567.68469, "r_x2": 257.47351, "r_y2": 558.77814, "r_x3": 50.111984, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.94919, "r_y0": 567.68469, "r_x1": 286.36505, "r_y1": 567.68469, "r_x2": 286.36505, "r_y2": 558.77814, "r_x3": 263.94919, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 579.63969, "r_x1": 286.36508, "r_y1": 579.63969, "r_x2": 286.36508, "r_y2": 570.73314, "r_x3": 50.111984, "r_y3": 570.73314, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 591.5947, "r_x1": 286.36511, "r_y1": 591.5947, "r_x2": 286.36511, "r_y2": 582.68814, "r_x3": 50.111984, "r_y3": 582.68814, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 603.5497, "r_x1": 286.36511, "r_y1": 603.5497, "r_x2": 286.36511, "r_y2": 594.64314, "r_x3": 50.111984, "r_y3": 594.64314, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 615.5047, "r_x1": 286.36505, "r_y1": 615.5047, "r_x2": 286.36505, "r_y2": 606.5981400000001, "r_x3": 50.111984, "r_y3": 606.5981400000001, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 627.4597, "r_x1": 242.2606, "r_y1": 627.4597, "r_x2": 242.2606, "r_y2": 618.55315, "r_x3": 50.111984, "r_y3": 618.55315, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 50.111984, "t": 630.71014, "r": 286.36496, "b": 651.57269, "coord_origin": "TOPLEFT" }, "confidence": 0.9335853457450867, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 639.6167, "r_x1": 286.36496, "r_y1": 639.6167, "r_x2": 286.36496, "r_y2": 630.71014, "r_x3": 62.06698600000001, "r_y3": 630.71014, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 651.57269, "r_x1": 179.90472, "r_y1": 651.57269, "r_x2": 179.90472, "r_y2": 642.66614, "r_x3": 50.111984, "r_y3": 642.66614, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "section_header", "bbox": { "l": 50.111984, "t": 662.39014, "r": 153.60785, "b": 672.24219, "coord_origin": "TOPLEFT" }, "confidence": 0.9515743255615234, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 672.24219, "r_x1": 64.297272, "r_y1": 672.24219, "r_x2": 64.297272, "r_y2": 662.39014, "r_x3": 50.111984, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.754135, "r_y0": 672.24219, "r_x1": 153.60785, "r_y1": 672.24219, "r_x2": 153.60785, "r_y2": 662.39014, "r_x3": 73.754135, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.111984, "t": 681.33113, "r": 286.36505, "b": 714.147705, "coord_origin": "TOPLEFT" }, "confidence": 0.9783332347869873, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 690.2377, "r_x1": 286.36493, "r_y1": 690.2377, "r_x2": 286.36493, "r_y2": 681.33113, "r_x3": 62.06698600000001, "r_y3": 681.33113, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 702.1927029999999, "r_x1": 286.36505, "r_y1": 702.1927029999999, "r_x2": 286.36505, "r_y2": 693.2861330000001, "r_x3": 50.111984, "r_y3": 693.2861330000001, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 714.147705, "r_x1": 84.144226, "r_y1": 714.147705, "r_x2": 84.144226, "r_y2": 705.241135, "r_x3": 50.111984, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.237595, "r_y0": 714.147705, "r_x1": 286.36505, "r_y1": 714.147705, "r_x2": 286.36505, "r_y2": 705.241135, "r_x3": 91.237595, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 308.862, "t": 162.65515000000005, "r": 545.11511, "b": 207.42773, "coord_origin": "TOPLEFT" }, "confidence": 0.9596064686775208, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 171.56170999999995, "r_x1": 545.11511, "r_y1": 171.56170999999995, "r_x2": 545.11511, "r_y2": 162.65515000000005, "r_x3": 308.862, "r_y3": 162.65515000000005, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.51671999999996, "r_x1": 545.11511, "r_y1": 183.51671999999996, "r_x2": 545.11511, "r_y2": 174.61017000000004, "r_x3": 308.862, "r_y3": 174.61017000000004, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 195.47173999999995, "r_x1": 545.11511, "r_y1": 195.47173999999995, "r_x2": 545.11511, "r_y2": 186.56519000000003, "r_x3": 308.862, "r_y3": 186.56519000000003, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 207.42773, "r_x1": 484.07434, "r_y1": 207.42773, "r_x2": 484.07434, "r_y2": 198.52117999999996, "r_x3": 308.862, "r_y3": 198.52117999999996, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 308.862, "t": 211.23517000000004, "r": 545.11505, "b": 232.09673999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9261796474456787, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 220.14171999999996, "r_x1": 545.11505, "r_y1": 220.14171999999996, "r_x2": 545.11505, "r_y2": 211.23517000000004, "r_x3": 320.81699, "r_y3": 211.23517000000004, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 232.09673999999995, "r_x1": 448.08939, "r_y1": 232.09673999999995, "r_x2": 448.08939, "r_y2": 223.19019000000003, "r_x3": 308.862, "r_y3": 223.19019000000003, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 308.862, "t": 235.90521, "r": 545.11511, "b": 316.54279, "coord_origin": "TOPLEFT" }, "confidence": 0.9642952680587769, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 244.81177000000002, "r_x1": 328.28894, "r_y1": 244.81177000000002, "r_x2": 328.28894, "r_y2": 235.90521, "r_x3": 320.81699, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38232, "r_y0": 244.81177000000002, "r_x1": 545.11499, "r_y1": 244.81177000000002, "r_x2": 545.11499, "r_y2": 235.90521, "r_x3": 335.38232, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 256.76678000000004, "r_x1": 545.11511, "r_y1": 256.76678000000004, "r_x2": 545.11511, "r_y2": 247.86023, "r_x3": 308.862, "r_y3": 247.86023, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 268.72180000000003, "r_x1": 545.11511, "r_y1": 268.72180000000003, "r_x2": 545.11511, "r_y2": 259.81525, "r_x3": 308.862, "r_y3": 259.81525, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 280.67682, "r_x1": 393.3847, "r_y1": 280.67682, "r_x2": 393.3847, "r_y2": 271.77026, "r_x3": 308.862, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.11942, "r_y0": 280.67682, "r_x1": 545.11511, "r_y1": 280.67682, "r_x2": 545.11511, "r_y2": 271.77026, "r_x3": 400.11942, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 292.63181, "r_x1": 545.11505, "r_y1": 292.63181, "r_x2": 545.11505, "r_y2": 283.72524999999996, "r_x3": 308.862, "r_y3": 283.72524999999996, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 304.5878000000001, "r_x1": 545.11511, "r_y1": 304.5878000000001, "r_x2": 545.11511, "r_y2": 295.68124, "r_x3": 308.862, "r_y3": 295.68124, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 316.54279, "r_x1": 425.69348, "r_y1": 316.54279, "r_x2": 425.69348, "r_y2": 307.63623, "r_x3": 308.862, "r_y3": 307.63623, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 308.862, "t": 320.35022, "r": 545.11517, "b": 448.80865, "coord_origin": "TOPLEFT" }, "confidence": 0.9699994921684265, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 329.25677, "r_x1": 328.4949, "r_y1": 329.25677, "r_x2": 328.4949, "r_y2": 320.35022, "r_x3": 320.81699, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05423, "r_y0": 329.25677, "r_x1": 545.11499, "r_y1": 329.25677, "r_x2": 545.11499, "r_y2": 320.35022, "r_x3": 331.05423, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 341.21176, "r_x1": 545.11517, "r_y1": 341.21176, "r_x2": 545.11517, "r_y2": 332.30521000000005, "r_x3": 308.862, "r_y3": 332.30521000000005, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 353.16675, "r_x1": 545.11505, "r_y1": 353.16675, "r_x2": 545.11505, "r_y2": 344.26018999999997, "r_x3": 308.862, "r_y3": 344.26018999999997, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 365.12273999999996, "r_x1": 545.11511, "r_y1": 365.12273999999996, "r_x2": 545.11511, "r_y2": 356.21619, "r_x3": 308.862, "r_y3": 356.21619, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 377.07773, "r_x1": 545.11511, "r_y1": 377.07773, "r_x2": 545.11511, "r_y2": 368.17117, "r_x3": 308.862, "r_y3": 368.17117, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 389.03271, "r_x1": 545.11499, "r_y1": 389.03271, "r_x2": 545.11499, "r_y2": 380.12616, "r_x3": 308.862, "r_y3": 380.12616, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.98769999999996, "r_x1": 545.11517, "r_y1": 400.98769999999996, "r_x2": 545.11517, "r_y2": 392.08115, "r_x3": 308.862, "r_y3": 392.08115, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.94269, "r_x1": 545.11511, "r_y1": 412.94269, "r_x2": 545.11511, "r_y2": 404.03613000000007, "r_x3": 308.862, "r_y3": 404.03613000000007, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.89767, "r_x1": 545.11499, "r_y1": 424.89767, "r_x2": 545.11499, "r_y2": 415.99112, "r_x3": 308.862, "r_y3": 415.99112, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.85367, "r_x1": 545.11517, "r_y1": 436.85367, "r_x2": 545.11517, "r_y2": 427.94711, "r_x3": 308.862, "r_y3": 427.94711, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.80865, "r_x1": 345.94278, "r_y1": 448.80865, "r_x2": 345.94278, "r_y2": 439.9021, "r_x3": 308.862, "r_y3": 439.9021, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 452.61609, "r": 545.11517, "b": 497.38861, "coord_origin": "TOPLEFT" }, "confidence": 0.9568928480148315, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 461.52264, "r_x1": 328.30341, "r_y1": 461.52264, "r_x2": 328.30341, "r_y2": 452.61609, "r_x3": 320.81699, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.79889, "r_y0": 461.52264, "r_x1": 485.75772000000006, "r_y1": 461.52264, "r_x2": 485.75772000000006, "r_y2": 452.61609, "r_x3": 330.79889, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.073, "r_y0": 461.29352, "r_x1": 511.86368, "r_y1": 461.29352, "r_x2": 511.86368, "r_y2": 452.70575, "r_x3": 488.073, "r_y3": 452.70575, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86301, "r_y0": 461.52264, "r_x1": 545.10815, "r_y1": 461.52264, "r_x2": 545.10815, "r_y2": 452.61609, "r_x3": 511.86301, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 473.47763, "r_x1": 545.11505, "r_y1": 473.47763, "r_x2": 545.11505, "r_y2": 464.57108, "r_x3": 308.862, "r_y3": 464.57108, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 485.43362, "r_x1": 545.11517, "r_y1": 485.43362, "r_x2": 545.11517, "r_y2": 476.52707, "r_x3": 308.862, "r_y3": 476.52707, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.38861, "r_x1": 379.14816, "r_y1": 497.38861, "r_x2": 379.14816, "r_y2": 488.48206, "r_x3": 308.862, "r_y3": 488.48206, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 308.862, "t": 501.19604, "r": 545.1153, "b": 545.96858, "coord_origin": "TOPLEFT" }, "confidence": 0.9710659980773926, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 510.1026, "r_x1": 328.66177, "r_y1": 510.1026, "r_x2": 328.66177, "r_y2": 501.19604, "r_x3": 320.81699, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2767, "r_y0": 510.1026, "r_x1": 545.11493, "r_y1": 510.1026, "r_x2": 545.11493, "r_y2": 501.19604, "r_x3": 331.2767, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 522.05759, "r_x1": 545.1153, "r_y1": 522.05759, "r_x2": 545.1153, "r_y2": 513.15103, "r_x3": 308.862, "r_y3": 513.15103, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 534.01358, "r_x1": 384.29883, "r_y1": 534.01358, "r_x2": 384.29883, "r_y2": 525.10703, "r_x3": 308.862, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25272, "r_y0": 534.01358, "r_x1": 545.11511, "r_y1": 534.01358, "r_x2": 545.11511, "r_y2": 525.10703, "r_x3": 391.25272, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.96858, "r_x1": 496.15897000000007, "r_y1": 545.96858, "r_x2": 496.15897000000007, "r_y2": 537.06203, "r_x3": 308.862, "r_y3": 537.06203, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 308.862, "t": 549.77603, "r": 545.11517, "b": 606.50359, "coord_origin": "TOPLEFT" }, "confidence": 0.9778757095336914, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 558.68259, "r_x1": 328.28894, "r_y1": 558.68259, "r_x2": 328.28894, "r_y2": 549.77603, "r_x3": 320.81699, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.40222, "r_y0": 558.68259, "r_x1": 545.11499, "r_y1": 558.68259, "r_x2": 545.11499, "r_y2": 549.77603, "r_x3": 335.40222, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 570.63759, "r_x1": 545.11517, "r_y1": 570.63759, "r_x2": 545.11517, "r_y2": 561.73103, "r_x3": 308.862, "r_y3": 561.73103, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 582.59259, "r_x1": 545.11511, "r_y1": 582.59259, "r_x2": 545.11511, "r_y2": 573.68604, "r_x3": 308.862, "r_y3": 573.68604, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 594.54858, "r_x1": 545.11505, "r_y1": 594.54858, "r_x2": 545.11505, "r_y2": 585.64203, "r_x3": 308.862, "r_y3": 585.64203, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 606.50359, "r_x1": 341.2305, "r_y1": 606.50359, "r_x2": 341.2305, "r_y2": 597.59703, "r_x3": 308.862, "r_y3": 597.59703, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "section_header", "bbox": { "l": 308.862, "t": 622.2905900000001, "r": 545.10876, "b": 646.98631, "coord_origin": "TOPLEFT" }, "confidence": 0.954940915107727, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 633.03831, "r_x1": 316.76675, "r_y1": 633.03831, "r_x2": 316.76675, "r_y2": 622.2905900000001, "r_x3": 308.862, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.30643, "r_y0": 633.03831, "r_x1": 545.10876, "r_y1": 633.03831, "r_x2": 545.10876, "r_y2": 622.2905900000001, "r_x3": 327.30643, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 646.98631, "r_x1": 357.34055, "r_y1": 646.98631, "r_x2": 357.34055, "r_y2": 636.2385899999999, "r_x3": 326.79501, "r_y3": 636.2385899999999, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.86203, "t": 657.42104, "r": 545.11517, "b": 714.148605, "coord_origin": "TOPLEFT" }, "confidence": 0.9829329252243042, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 666.3276, "r_x1": 545.11499, "r_y1": 666.3276, "r_x2": 545.11499, "r_y2": 657.42104, "r_x3": 320.81702, "r_y3": 657.42104, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 678.2826, "r_x1": 545.11511, "r_y1": 678.2826, "r_x2": 545.11511, "r_y2": 669.37604, "r_x3": 308.86203, "r_y3": 669.37604, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 690.2376, "r_x1": 545.11517, "r_y1": 690.2376, "r_x2": 545.11517, "r_y2": 681.33104, "r_x3": 308.86203, "r_y3": 681.33104, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 702.1926040000001, "r_x1": 545.11505, "r_y1": 702.1926040000001, "r_x2": 545.11505, "r_y2": 693.286041, "r_x3": 308.86203, "r_y3": 693.286041, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 714.148605, "r_x1": 371.42719, "r_y1": 714.148605, "r_x2": 371.42719, "r_y2": 705.242035, "r_x3": 308.86203, "r_y3": 705.242035, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "page_footer", "bbox": { "l": 292.63104, "t": 734.1330379999999, "r": 302.59363, "b": 743.0396, "coord_origin": "TOPLEFT" }, "confidence": 0.8986663222312927, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63104, "r_y0": 743.0396, "r_x1": 302.59363, "r_y1": 743.0396, "r_x2": 302.59363, "r_y2": 734.1330379999999, "r_x3": 292.63104, "r_y3": 734.1330379999999, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 18, "page_no": 10, "cluster": { "id": 18, "label": "section_header", "bbox": { "l": 132.842, "t": 110.57488999999998, "r": 465.37591999999995, "b": 135.53008999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.6497084498405457, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.842, "r_y0": 121.32263, "r_x1": 465.37591999999995, "r_y1": 121.32263, "r_x2": 465.37591999999995, "r_y2": 110.57488999999998, "r_x3": 132.842, "r_y3": 110.57488999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18399, "r_y0": 135.53008999999997, "r_x1": 375.04269, "r_y1": 135.53008999999997, "r_x2": 375.04269, "r_y2": 122.25982999999997, "r_x3": 220.18399, "r_y3": 122.25982999999997, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material" }, { "label": "section_header", "id": 13, "page_no": 10, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.111984, "t": 161.16089, "r": 175.96437, "b": 171.90863000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9454860091209412, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 171.90863000000002, "r_x1": 57.089828, "r_y1": 171.90863000000002, "r_x2": 57.089828, "r_y2": 161.16089, "r_x3": 50.111984, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.393616, "r_y0": 171.90863000000002, "r_x1": 175.96437, "r_y1": 171.90863000000002, "r_x2": 175.96437, "r_y2": 161.16089, "r_x3": 66.393616, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Details on the datasets" }, { "label": "section_header", "id": 11, "page_no": 10, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 50.111984, "t": 180.97931000000005, "r": 150.36401, "b": 190.83136000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9535645842552185, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 190.83136000000002, "r_x1": 64.210808, "r_y1": 190.83136000000002, "r_x2": 64.210808, "r_y2": 180.97931000000005, "r_x3": 50.111984, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.610023, "r_y0": 190.83136000000002, "r_x1": 150.36401, "r_y1": 190.83136000000002, "r_x2": 150.36401, "r_y2": 180.97931000000005, "r_x3": 73.610023, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.1. Data preparation" }, { "label": "text", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.111984, "t": 199.92029000000002, "r": 286.36514, "b": 388.15482000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9864971041679382, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 208.82683999999995, "r_x1": 286.36496, "r_y1": 208.82683999999995, "r_x2": 286.36496, "r_y2": 199.92029000000002, "r_x3": 62.06698600000001, "r_y3": 199.92029000000002, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 220.78283999999996, "r_x1": 286.36505, "r_y1": 220.78283999999996, "r_x2": 286.36505, "r_y2": 211.87627999999995, "r_x3": 50.111984, "r_y3": 211.87627999999995, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 232.73784999999998, "r_x1": 286.36514, "r_y1": 232.73784999999998, "r_x2": 286.36514, "r_y2": 223.83130000000006, "r_x3": 50.111984, "r_y3": 223.83130000000006, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 244.69286999999997, "r_x1": 286.36508, "r_y1": 244.69286999999997, "r_x2": 286.36508, "r_y2": 235.78632000000005, "r_x3": 50.111984, "r_y3": 235.78632000000005, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 256.64788999999996, "r_x1": 286.36505, "r_y1": 256.64788999999996, "r_x2": 286.36505, "r_y2": 247.74132999999995, "r_x3": 50.111984, "r_y3": 247.74132999999995, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 268.60290999999995, "r_x1": 286.36505, "r_y1": 268.60290999999995, "r_x2": 286.36505, "r_y2": 259.69635000000005, "r_x3": 50.111984, "r_y3": 259.69635000000005, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 280.55792, "r_x1": 286.36505, "r_y1": 280.55792, "r_x2": 286.36505, "r_y2": 271.65137000000004, "r_x3": 50.111984, "r_y3": 271.65137000000004, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 292.5139199999999, "r_x1": 286.36502, "r_y1": 292.5139199999999, "r_x2": 286.36502, "r_y2": 283.60736, "r_x3": 50.111984, "r_y3": 283.60736, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 304.4689, "r_x1": 286.36505, "r_y1": 304.4689, "r_x2": 286.36505, "r_y2": 295.56235, "r_x3": 50.111984, "r_y3": 295.56235, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 316.42389, "r_x1": 286.36508, "r_y1": 316.42389, "r_x2": 286.36508, "r_y2": 307.5173300000001, "r_x3": 50.111984, "r_y3": 307.5173300000001, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 328.3788799999999, "r_x1": 286.36505, "r_y1": 328.3788799999999, "r_x2": 286.36505, "r_y2": 319.47232, "r_x3": 50.111984, "r_y3": 319.47232, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 340.33386, "r_x1": 286.36502, "r_y1": 340.33386, "r_x2": 286.36502, "r_y2": 331.42731000000003, "r_x3": 50.111984, "r_y3": 331.42731000000003, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 352.28986, "r_x1": 286.36508, "r_y1": 352.28986, "r_x2": 286.36508, "r_y2": 343.3833, "r_x3": 50.111984, "r_y3": 343.3833, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 364.24484000000007, "r_x1": 286.36505, "r_y1": 364.24484000000007, "r_x2": 286.36505, "r_y2": 355.33829, "r_x3": 50.111984, "r_y3": 355.33829, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 376.19983, "r_x1": 286.36508, "r_y1": 376.19983, "r_x2": 286.36508, "r_y2": 367.29327, "r_x3": 50.111984, "r_y3": 367.29327, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 388.15482000000003, "r_x1": 230.80364999999998, "r_y1": 388.15482000000003, "r_x2": 230.80364999999998, "r_y2": 379.24826, "r_x3": 50.111984, "r_y3": 379.24826, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length." }, { "label": "text", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.111984, "t": 391.40527, "r": 286.36511, "b": 627.4597, "coord_origin": "TOPLEFT" }, "confidence": 0.9826022386550903, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 400.31183, "r_x1": 286.36499, "r_y1": 400.31183, "r_x2": 286.36499, "r_y2": 391.40527, "r_x3": 62.06698600000001, "r_y3": 391.40527, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 412.26681999999994, "r_x1": 286.36508, "r_y1": 412.26681999999994, "r_x2": 286.36508, "r_y2": 403.36026, "r_x3": 50.111984, "r_y3": 403.36026, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 424.22180000000003, "r_x1": 286.36505, "r_y1": 424.22180000000003, "r_x2": 286.36505, "r_y2": 415.31525, "r_x3": 50.111984, "r_y3": 415.31525, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 436.1778, "r_x1": 286.36505, "r_y1": 436.1778, "r_x2": 286.36505, "r_y2": 427.2712399999999, "r_x3": 50.111984, "r_y3": 427.2712399999999, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 448.1327800000001, "r_x1": 286.36508, "r_y1": 448.1327800000001, "r_x2": 286.36508, "r_y2": 439.22623, "r_x3": 50.111984, "r_y3": 439.22623, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 460.08777, "r_x1": 286.36511, "r_y1": 460.08777, "r_x2": 286.36511, "r_y2": 451.18121, "r_x3": 50.111984, "r_y3": 451.18121, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 472.04276, "r_x1": 286.36505, "r_y1": 472.04276, "r_x2": 286.36505, "r_y2": 463.1362, "r_x3": 50.111984, "r_y3": 463.1362, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 483.99774, "r_x1": 286.36508, "r_y1": 483.99774, "r_x2": 286.36508, "r_y2": 475.09119, "r_x3": 50.111984, "r_y3": 475.09119, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 495.95273, "r_x1": 286.36502, "r_y1": 495.95273, "r_x2": 286.36502, "r_y2": 487.04617, "r_x3": 50.111984, "r_y3": 487.04617, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 507.90872, "r_x1": 286.36511, "r_y1": 507.90872, "r_x2": 286.36511, "r_y2": 499.00217, "r_x3": 50.111984, "r_y3": 499.00217, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 519.8637100000001, "r_x1": 286.36508, "r_y1": 519.8637100000001, "r_x2": 286.36508, "r_y2": 510.95715, "r_x3": 50.111984, "r_y3": 510.95715, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 531.8187, "r_x1": 286.36508, "r_y1": 531.8187, "r_x2": 286.36508, "r_y2": 522.91214, "r_x3": 50.111984, "r_y3": 522.91214, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 543.7737, "r_x1": 286.36505, "r_y1": 543.7737, "r_x2": 286.36505, "r_y2": 534.86713, "r_x3": 50.111984, "r_y3": 534.86713, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 555.7287, "r_x1": 286.36502, "r_y1": 555.7287, "r_x2": 286.36502, "r_y2": 546.82214, "r_x3": 50.111984, "r_y3": 546.82214, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 567.68469, "r_x1": 257.47351, "r_y1": 567.68469, "r_x2": 257.47351, "r_y2": 558.77814, "r_x3": 50.111984, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.94919, "r_y0": 567.68469, "r_x1": 286.36505, "r_y1": 567.68469, "r_x2": 286.36505, "r_y2": 558.77814, "r_x3": 263.94919, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 579.63969, "r_x1": 286.36508, "r_y1": 579.63969, "r_x2": 286.36508, "r_y2": 570.73314, "r_x3": 50.111984, "r_y3": 570.73314, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 591.5947, "r_x1": 286.36511, "r_y1": 591.5947, "r_x2": 286.36511, "r_y2": 582.68814, "r_x3": 50.111984, "r_y3": 582.68814, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 603.5497, "r_x1": 286.36511, "r_y1": 603.5497, "r_x2": 286.36511, "r_y2": 594.64314, "r_x3": 50.111984, "r_y3": 594.64314, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 615.5047, "r_x1": 286.36505, "r_y1": 615.5047, "r_x2": 286.36505, "r_y2": 606.5981400000001, "r_x3": 50.111984, "r_y3": 606.5981400000001, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 627.4597, "r_x1": 242.2606, "r_y1": 627.4597, "r_x2": 242.2606, "r_y2": 618.55315, "r_x3": 50.111984, "r_y3": 618.55315, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 14, "page_no": 10, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.111984, "t": 630.71014, "r": 286.36496, "b": 651.57269, "coord_origin": "TOPLEFT" }, "confidence": 0.9335853457450867, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 639.6167, "r_x1": 286.36496, "r_y1": 639.6167, "r_x2": 286.36496, "r_y2": 630.71014, "r_x3": 62.06698600000001, "r_y3": 630.71014, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 651.57269, "r_x1": 179.90472, "r_y1": 651.57269, "r_x2": 179.90472, "r_y2": 642.66614, "r_x3": 50.111984, "r_y3": 642.66614, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset." }, { "label": "section_header", "id": 12, "page_no": 10, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.111984, "t": 662.39014, "r": 153.60785, "b": 672.24219, "coord_origin": "TOPLEFT" }, "confidence": 0.9515743255615234, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 672.24219, "r_x1": 64.297272, "r_y1": 672.24219, "r_x2": 64.297272, "r_y2": 662.39014, "r_x3": 50.111984, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.754135, "r_y0": 672.24219, "r_x1": 153.60785, "r_y1": 672.24219, "r_x2": 153.60785, "r_y2": 662.39014, "r_x3": 73.754135, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.2. Synthetic datasets" }, { "label": "text", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.111984, "t": 681.33113, "r": 286.36505, "b": 714.147705, "coord_origin": "TOPLEFT" }, "confidence": 0.9783332347869873, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 690.2377, "r_x1": 286.36493, "r_y1": 690.2377, "r_x2": 286.36493, "r_y2": 681.33113, "r_x3": 62.06698600000001, "r_y3": 681.33113, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 702.1927029999999, "r_x1": 286.36505, "r_y1": 702.1927029999999, "r_x2": 286.36505, "r_y2": 693.2861330000001, "r_x3": 50.111984, "r_y3": 693.2861330000001, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 714.147705, "r_x1": 84.144226, "r_y1": 714.147705, "r_x2": 84.144226, "r_y2": 705.241135, "r_x3": 50.111984, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.237595, "r_y0": 714.147705, "r_x1": 286.36505, "r_y1": 714.147705, "r_x2": 286.36505, "r_y2": 705.241135, "r_x3": 91.237595, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-" }, { "label": "text", "id": 8, "page_no": 10, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.862, "t": 162.65515000000005, "r": 545.11511, "b": 207.42773, "coord_origin": "TOPLEFT" }, "confidence": 0.9596064686775208, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 171.56170999999995, "r_x1": 545.11511, "r_y1": 171.56170999999995, "r_x2": 545.11511, "r_y2": 162.65515000000005, "r_x3": 308.862, "r_y3": 162.65515000000005, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.51671999999996, "r_x1": 545.11511, "r_y1": 183.51671999999996, "r_x2": 545.11511, "r_y2": 174.61017000000004, "r_x3": 308.862, "r_y3": 174.61017000000004, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 195.47173999999995, "r_x1": 545.11511, "r_y1": 195.47173999999995, "r_x2": 545.11511, "r_y2": 186.56519000000003, "r_x3": 308.862, "r_y3": 186.56519000000003, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 207.42773, "r_x1": 484.07434, "r_y1": 207.42773, "r_x2": 484.07434, "r_y2": 198.52117999999996, "r_x3": 308.862, "r_y3": 198.52117999999996, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)." }, { "label": "text", "id": 15, "page_no": 10, "cluster": { "id": 15, "label": "text", "bbox": { "l": 308.862, "t": 211.23517000000004, "r": 545.11505, "b": 232.09673999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9261796474456787, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 220.14171999999996, "r_x1": 545.11505, "r_y1": 220.14171999999996, "r_x2": 545.11505, "r_y2": 211.23517000000004, "r_x3": 320.81699, "r_y3": 211.23517000000004, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 232.09673999999995, "r_x1": 448.08939, "r_y1": 232.09673999999995, "r_x2": 448.08939, "r_y2": 223.19019000000003, "r_x3": 308.862, "r_y3": 223.19019000000003, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The process of generating a synthetic dataset can be decomposed into the following steps:" }, { "label": "list_item", "id": 7, "page_no": 10, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 308.862, "t": 235.90521, "r": 545.11511, "b": 316.54279, "coord_origin": "TOPLEFT" }, "confidence": 0.9642952680587769, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 244.81177000000002, "r_x1": 328.28894, "r_y1": 244.81177000000002, "r_x2": 328.28894, "r_y2": 235.90521, "r_x3": 320.81699, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38232, "r_y0": 244.81177000000002, "r_x1": 545.11499, "r_y1": 244.81177000000002, "r_x2": 545.11499, "r_y2": 235.90521, "r_x3": 335.38232, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 256.76678000000004, "r_x1": 545.11511, "r_y1": 256.76678000000004, "r_x2": 545.11511, "r_y2": 247.86023, "r_x3": 308.862, "r_y3": 247.86023, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 268.72180000000003, "r_x1": 545.11511, "r_y1": 268.72180000000003, "r_x2": 545.11511, "r_y2": 259.81525, "r_x3": 308.862, "r_y3": 259.81525, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 280.67682, "r_x1": 393.3847, "r_y1": 280.67682, "r_x2": 393.3847, "r_y2": 271.77026, "r_x3": 308.862, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.11942, "r_y0": 280.67682, "r_x1": 545.11511, "r_y1": 280.67682, "r_x2": 545.11511, "r_y2": 271.77026, "r_x3": 400.11942, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 292.63181, "r_x1": 545.11505, "r_y1": 292.63181, "r_x2": 545.11505, "r_y2": 283.72524999999996, "r_x3": 308.862, "r_y3": 283.72524999999996, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 304.5878000000001, "r_x1": 545.11511, "r_y1": 304.5878000000001, "r_x2": 545.11511, "r_y2": 295.68124, "r_x3": 308.862, "r_y3": 295.68124, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 316.54279, "r_x1": 425.69348, "r_y1": 316.54279, "r_x2": 425.69348, "r_y2": 307.63623, "r_x3": 308.862, "r_y3": 307.63623, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)." }, { "label": "list_item", "id": 6, "page_no": 10, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.862, "t": 320.35022, "r": 545.11517, "b": 448.80865, "coord_origin": "TOPLEFT" }, "confidence": 0.9699994921684265, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 329.25677, "r_x1": 328.4949, "r_y1": 329.25677, "r_x2": 328.4949, "r_y2": 320.35022, "r_x3": 320.81699, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05423, "r_y0": 329.25677, "r_x1": 545.11499, "r_y1": 329.25677, "r_x2": 545.11499, "r_y2": 320.35022, "r_x3": 331.05423, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 341.21176, "r_x1": 545.11517, "r_y1": 341.21176, "r_x2": 545.11517, "r_y2": 332.30521000000005, "r_x3": 308.862, "r_y3": 332.30521000000005, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 353.16675, "r_x1": 545.11505, "r_y1": 353.16675, "r_x2": 545.11505, "r_y2": 344.26018999999997, "r_x3": 308.862, "r_y3": 344.26018999999997, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 365.12273999999996, "r_x1": 545.11511, "r_y1": 365.12273999999996, "r_x2": 545.11511, "r_y2": 356.21619, "r_x3": 308.862, "r_y3": 356.21619, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 377.07773, "r_x1": 545.11511, "r_y1": 377.07773, "r_x2": 545.11511, "r_y2": 368.17117, "r_x3": 308.862, "r_y3": 368.17117, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 389.03271, "r_x1": 545.11499, "r_y1": 389.03271, "r_x2": 545.11499, "r_y2": 380.12616, "r_x3": 308.862, "r_y3": 380.12616, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.98769999999996, "r_x1": 545.11517, "r_y1": 400.98769999999996, "r_x2": 545.11517, "r_y2": 392.08115, "r_x3": 308.862, "r_y3": 392.08115, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.94269, "r_x1": 545.11511, "r_y1": 412.94269, "r_x2": 545.11511, "r_y2": 404.03613000000007, "r_x3": 308.862, "r_y3": 404.03613000000007, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.89767, "r_x1": 545.11499, "r_y1": 424.89767, "r_x2": 545.11499, "r_y2": 415.99112, "r_x3": 308.862, "r_y3": 415.99112, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.85367, "r_x1": 545.11517, "r_y1": 436.85367, "r_x2": 545.11517, "r_y2": 427.94711, "r_x3": 308.862, "r_y3": 427.94711, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.80865, "r_x1": 345.94278, "r_y1": 448.80865, "r_x2": 345.94278, "r_y2": 439.9021, "r_x3": 308.862, "r_y3": 439.9021, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans." }, { "label": "list_item", "id": 9, "page_no": 10, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 452.61609, "r": 545.11517, "b": 497.38861, "coord_origin": "TOPLEFT" }, "confidence": 0.9568928480148315, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 461.52264, "r_x1": 328.30341, "r_y1": 461.52264, "r_x2": 328.30341, "r_y2": 452.61609, "r_x3": 320.81699, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.79889, "r_y0": 461.52264, "r_x1": 485.75772000000006, "r_y1": 461.52264, "r_x2": 485.75772000000006, "r_y2": 452.61609, "r_x3": 330.79889, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.073, "r_y0": 461.29352, "r_x1": 511.86368, "r_y1": 461.29352, "r_x2": 511.86368, "r_y2": 452.70575, "r_x3": 488.073, "r_y3": 452.70575, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86301, "r_y0": 461.52264, "r_x1": 545.10815, "r_y1": 461.52264, "r_x2": 545.10815, "r_y2": 452.61609, "r_x3": 511.86301, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 473.47763, "r_x1": 545.11505, "r_y1": 473.47763, "r_x2": 545.11505, "r_y2": 464.57108, "r_x3": 308.862, "r_y3": 464.57108, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 485.43362, "r_x1": 545.11517, "r_y1": 485.43362, "r_x2": 545.11517, "r_y2": 476.52707, "r_x3": 308.862, "r_y3": 476.52707, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.38861, "r_x1": 379.14816, "r_y1": 497.38861, "r_x2": 379.14816, "r_y2": 488.48206, "r_x3": 308.862, "r_y3": 488.48206, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content." }, { "label": "list_item", "id": 5, "page_no": 10, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 308.862, "t": 501.19604, "r": 545.1153, "b": 545.96858, "coord_origin": "TOPLEFT" }, "confidence": 0.9710659980773926, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 510.1026, "r_x1": 328.66177, "r_y1": 510.1026, "r_x2": 328.66177, "r_y2": 501.19604, "r_x3": 320.81699, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2767, "r_y0": 510.1026, "r_x1": 545.11493, "r_y1": 510.1026, "r_x2": 545.11493, "r_y2": 501.19604, "r_x3": 331.2767, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 522.05759, "r_x1": 545.1153, "r_y1": 522.05759, "r_x2": 545.1153, "r_y2": 513.15103, "r_x3": 308.862, "r_y3": 513.15103, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 534.01358, "r_x1": 384.29883, "r_y1": 534.01358, "r_x2": 384.29883, "r_y2": 525.10703, "r_x3": 308.862, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25272, "r_y0": 534.01358, "r_x1": 545.11511, "r_y1": 534.01358, "r_x2": 545.11511, "r_y2": 525.10703, "r_x3": 391.25272, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.96858, "r_x1": 496.15897000000007, "r_y1": 545.96858, "r_x2": 496.15897000000007, "r_y2": 537.06203, "r_x3": 308.862, "r_y3": 537.06203, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table." }, { "label": "list_item", "id": 4, "page_no": 10, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 308.862, "t": 549.77603, "r": 545.11517, "b": 606.50359, "coord_origin": "TOPLEFT" }, "confidence": 0.9778757095336914, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 558.68259, "r_x1": 328.28894, "r_y1": 558.68259, "r_x2": 328.28894, "r_y2": 549.77603, "r_x3": 320.81699, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.40222, "r_y0": 558.68259, "r_x1": 545.11499, "r_y1": 558.68259, "r_x2": 545.11499, "r_y2": 549.77603, "r_x3": 335.40222, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 570.63759, "r_x1": 545.11517, "r_y1": 570.63759, "r_x2": 545.11517, "r_y2": 561.73103, "r_x3": 308.862, "r_y3": 561.73103, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 582.59259, "r_x1": 545.11511, "r_y1": 582.59259, "r_x2": 545.11511, "r_y2": 573.68604, "r_x3": 308.862, "r_y3": 573.68604, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 594.54858, "r_x1": 545.11505, "r_y1": 594.54858, "r_x2": 545.11505, "r_y2": 585.64203, "r_x3": 308.862, "r_y3": 585.64203, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 606.50359, "r_x1": 341.2305, "r_y1": 606.50359, "r_x2": 341.2305, "r_y2": 597.59703, "r_x3": 308.862, "r_y3": 597.59703, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process." }, { "label": "section_header", "id": 10, "page_no": 10, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 308.862, "t": 622.2905900000001, "r": 545.10876, "b": 646.98631, "coord_origin": "TOPLEFT" }, "confidence": 0.954940915107727, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 633.03831, "r_x1": 316.76675, "r_y1": 633.03831, "r_x2": 316.76675, "r_y2": 622.2905900000001, "r_x3": 308.862, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.30643, "r_y0": 633.03831, "r_x1": 545.10876, "r_y1": 633.03831, "r_x2": 545.10876, "r_y2": 622.2905900000001, "r_x3": 327.30643, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 646.98631, "r_x1": 357.34055, "r_y1": 646.98631, "r_x2": 357.34055, "r_y2": 636.2385899999999, "r_x3": 326.79501, "r_y3": 636.2385899999999, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Prediction post-processing for PDF documents" }, { "label": "text", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86203, "t": 657.42104, "r": 545.11517, "b": 714.148605, "coord_origin": "TOPLEFT" }, "confidence": 0.9829329252243042, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 666.3276, "r_x1": 545.11499, "r_y1": 666.3276, "r_x2": 545.11499, "r_y2": 657.42104, "r_x3": 320.81702, "r_y3": 657.42104, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 678.2826, "r_x1": 545.11511, "r_y1": 678.2826, "r_x2": 545.11511, "r_y2": 669.37604, "r_x3": 308.86203, "r_y3": 669.37604, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 690.2376, "r_x1": 545.11517, "r_y1": 690.2376, "r_x2": 545.11517, "r_y2": 681.33104, "r_x3": 308.86203, "r_y3": 681.33104, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 702.1926040000001, "r_x1": 545.11505, "r_y1": 702.1926040000001, "r_x2": 545.11505, "r_y2": 693.286041, "r_x3": 308.86203, "r_y3": 693.286041, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 714.148605, "r_x1": 371.42719, "r_y1": 714.148605, "r_x2": 371.42719, "r_y2": 705.242035, "r_x3": 308.86203, "r_y3": 705.242035, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:" }, { "label": "page_footer", "id": 16, "page_no": 10, "cluster": { "id": 16, "label": "page_footer", "bbox": { "l": 292.63104, "t": 734.1330379999999, "r": 302.59363, "b": 743.0396, "coord_origin": "TOPLEFT" }, "confidence": 0.8986663222312927, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63104, "r_y0": 743.0396, "r_x1": 302.59363, "r_y1": 743.0396, "r_x2": 302.59363, "r_y2": 734.1330379999999, "r_x3": 292.63104, "r_y3": 734.1330379999999, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" } ], "body": [ { "label": "section_header", "id": 18, "page_no": 10, "cluster": { "id": 18, "label": "section_header", "bbox": { "l": 132.842, "t": 110.57488999999998, "r": 465.37591999999995, "b": 135.53008999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.6497084498405457, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.842, "r_y0": 121.32263, "r_x1": 465.37591999999995, "r_y1": 121.32263, "r_x2": 465.37591999999995, "r_y2": 110.57488999999998, "r_x3": 132.842, "r_y3": 110.57488999999998, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18399, "r_y0": 135.53008999999997, "r_x1": 375.04269, "r_y1": 135.53008999999997, "r_x2": 375.04269, "r_y2": 122.25982999999997, "r_x3": 220.18399, "r_y3": 122.25982999999997, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material" }, { "label": "section_header", "id": 13, "page_no": 10, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.111984, "t": 161.16089, "r": 175.96437, "b": 171.90863000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9454860091209412, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 171.90863000000002, "r_x1": 57.089828, "r_y1": 171.90863000000002, "r_x2": 57.089828, "r_y2": 161.16089, "r_x3": 50.111984, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.393616, "r_y0": 171.90863000000002, "r_x1": 175.96437, "r_y1": 171.90863000000002, "r_x2": 175.96437, "r_y2": 161.16089, "r_x3": 66.393616, "r_y3": 161.16089, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Details on the datasets" }, { "label": "section_header", "id": 11, "page_no": 10, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 50.111984, "t": 180.97931000000005, "r": 150.36401, "b": 190.83136000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9535645842552185, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 190.83136000000002, "r_x1": 64.210808, "r_y1": 190.83136000000002, "r_x2": 64.210808, "r_y2": 180.97931000000005, "r_x3": 50.111984, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.610023, "r_y0": 190.83136000000002, "r_x1": 150.36401, "r_y1": 190.83136000000002, "r_x2": 150.36401, "r_y2": 180.97931000000005, "r_x3": 73.610023, "r_y3": 180.97931000000005, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.1. Data preparation" }, { "label": "text", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.111984, "t": 199.92029000000002, "r": 286.36514, "b": 388.15482000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9864971041679382, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 208.82683999999995, "r_x1": 286.36496, "r_y1": 208.82683999999995, "r_x2": 286.36496, "r_y2": 199.92029000000002, "r_x3": 62.06698600000001, "r_y3": 199.92029000000002, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 220.78283999999996, "r_x1": 286.36505, "r_y1": 220.78283999999996, "r_x2": 286.36505, "r_y2": 211.87627999999995, "r_x3": 50.111984, "r_y3": 211.87627999999995, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 232.73784999999998, "r_x1": 286.36514, "r_y1": 232.73784999999998, "r_x2": 286.36514, "r_y2": 223.83130000000006, "r_x3": 50.111984, "r_y3": 223.83130000000006, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 244.69286999999997, "r_x1": 286.36508, "r_y1": 244.69286999999997, "r_x2": 286.36508, "r_y2": 235.78632000000005, "r_x3": 50.111984, "r_y3": 235.78632000000005, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 256.64788999999996, "r_x1": 286.36505, "r_y1": 256.64788999999996, "r_x2": 286.36505, "r_y2": 247.74132999999995, "r_x3": 50.111984, "r_y3": 247.74132999999995, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 268.60290999999995, "r_x1": 286.36505, "r_y1": 268.60290999999995, "r_x2": 286.36505, "r_y2": 259.69635000000005, "r_x3": 50.111984, "r_y3": 259.69635000000005, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 280.55792, "r_x1": 286.36505, "r_y1": 280.55792, "r_x2": 286.36505, "r_y2": 271.65137000000004, "r_x3": 50.111984, "r_y3": 271.65137000000004, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 292.5139199999999, "r_x1": 286.36502, "r_y1": 292.5139199999999, "r_x2": 286.36502, "r_y2": 283.60736, "r_x3": 50.111984, "r_y3": 283.60736, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 304.4689, "r_x1": 286.36505, "r_y1": 304.4689, "r_x2": 286.36505, "r_y2": 295.56235, "r_x3": 50.111984, "r_y3": 295.56235, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 316.42389, "r_x1": 286.36508, "r_y1": 316.42389, "r_x2": 286.36508, "r_y2": 307.5173300000001, "r_x3": 50.111984, "r_y3": 307.5173300000001, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 328.3788799999999, "r_x1": 286.36505, "r_y1": 328.3788799999999, "r_x2": 286.36505, "r_y2": 319.47232, "r_x3": 50.111984, "r_y3": 319.47232, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 340.33386, "r_x1": 286.36502, "r_y1": 340.33386, "r_x2": 286.36502, "r_y2": 331.42731000000003, "r_x3": 50.111984, "r_y3": 331.42731000000003, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 352.28986, "r_x1": 286.36508, "r_y1": 352.28986, "r_x2": 286.36508, "r_y2": 343.3833, "r_x3": 50.111984, "r_y3": 343.3833, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 364.24484000000007, "r_x1": 286.36505, "r_y1": 364.24484000000007, "r_x2": 286.36505, "r_y2": 355.33829, "r_x3": 50.111984, "r_y3": 355.33829, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 376.19983, "r_x1": 286.36508, "r_y1": 376.19983, "r_x2": 286.36508, "r_y2": 367.29327, "r_x3": 50.111984, "r_y3": 367.29327, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 388.15482000000003, "r_x1": 230.80364999999998, "r_y1": 388.15482000000003, "r_x2": 230.80364999999998, "r_y2": 379.24826, "r_x3": 50.111984, "r_y3": 379.24826, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length." }, { "label": "text", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.111984, "t": 391.40527, "r": 286.36511, "b": 627.4597, "coord_origin": "TOPLEFT" }, "confidence": 0.9826022386550903, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 400.31183, "r_x1": 286.36499, "r_y1": 400.31183, "r_x2": 286.36499, "r_y2": 391.40527, "r_x3": 62.06698600000001, "r_y3": 391.40527, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 412.26681999999994, "r_x1": 286.36508, "r_y1": 412.26681999999994, "r_x2": 286.36508, "r_y2": 403.36026, "r_x3": 50.111984, "r_y3": 403.36026, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 424.22180000000003, "r_x1": 286.36505, "r_y1": 424.22180000000003, "r_x2": 286.36505, "r_y2": 415.31525, "r_x3": 50.111984, "r_y3": 415.31525, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 436.1778, "r_x1": 286.36505, "r_y1": 436.1778, "r_x2": 286.36505, "r_y2": 427.2712399999999, "r_x3": 50.111984, "r_y3": 427.2712399999999, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 448.1327800000001, "r_x1": 286.36508, "r_y1": 448.1327800000001, "r_x2": 286.36508, "r_y2": 439.22623, "r_x3": 50.111984, "r_y3": 439.22623, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 460.08777, "r_x1": 286.36511, "r_y1": 460.08777, "r_x2": 286.36511, "r_y2": 451.18121, "r_x3": 50.111984, "r_y3": 451.18121, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 472.04276, "r_x1": 286.36505, "r_y1": 472.04276, "r_x2": 286.36505, "r_y2": 463.1362, "r_x3": 50.111984, "r_y3": 463.1362, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 483.99774, "r_x1": 286.36508, "r_y1": 483.99774, "r_x2": 286.36508, "r_y2": 475.09119, "r_x3": 50.111984, "r_y3": 475.09119, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 495.95273, "r_x1": 286.36502, "r_y1": 495.95273, "r_x2": 286.36502, "r_y2": 487.04617, "r_x3": 50.111984, "r_y3": 487.04617, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 507.90872, "r_x1": 286.36511, "r_y1": 507.90872, "r_x2": 286.36511, "r_y2": 499.00217, "r_x3": 50.111984, "r_y3": 499.00217, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 519.8637100000001, "r_x1": 286.36508, "r_y1": 519.8637100000001, "r_x2": 286.36508, "r_y2": 510.95715, "r_x3": 50.111984, "r_y3": 510.95715, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 531.8187, "r_x1": 286.36508, "r_y1": 531.8187, "r_x2": 286.36508, "r_y2": 522.91214, "r_x3": 50.111984, "r_y3": 522.91214, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 543.7737, "r_x1": 286.36505, "r_y1": 543.7737, "r_x2": 286.36505, "r_y2": 534.86713, "r_x3": 50.111984, "r_y3": 534.86713, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 555.7287, "r_x1": 286.36502, "r_y1": 555.7287, "r_x2": 286.36502, "r_y2": 546.82214, "r_x3": 50.111984, "r_y3": 546.82214, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 567.68469, "r_x1": 257.47351, "r_y1": 567.68469, "r_x2": 257.47351, "r_y2": 558.77814, "r_x3": 50.111984, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.94919, "r_y0": 567.68469, "r_x1": 286.36505, "r_y1": 567.68469, "r_x2": 286.36505, "r_y2": 558.77814, "r_x3": 263.94919, "r_y3": 558.77814, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 579.63969, "r_x1": 286.36508, "r_y1": 579.63969, "r_x2": 286.36508, "r_y2": 570.73314, "r_x3": 50.111984, "r_y3": 570.73314, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 591.5947, "r_x1": 286.36511, "r_y1": 591.5947, "r_x2": 286.36511, "r_y2": 582.68814, "r_x3": 50.111984, "r_y3": 582.68814, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 603.5497, "r_x1": 286.36511, "r_y1": 603.5497, "r_x2": 286.36511, "r_y2": 594.64314, "r_x3": 50.111984, "r_y3": 594.64314, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 615.5047, "r_x1": 286.36505, "r_y1": 615.5047, "r_x2": 286.36505, "r_y2": 606.5981400000001, "r_x3": 50.111984, "r_y3": 606.5981400000001, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 627.4597, "r_x1": 242.2606, "r_y1": 627.4597, "r_x2": 242.2606, "r_y2": 618.55315, "r_x3": 50.111984, "r_y3": 618.55315, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 14, "page_no": 10, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.111984, "t": 630.71014, "r": 286.36496, "b": 651.57269, "coord_origin": "TOPLEFT" }, "confidence": 0.9335853457450867, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 639.6167, "r_x1": 286.36496, "r_y1": 639.6167, "r_x2": 286.36496, "r_y2": 630.71014, "r_x3": 62.06698600000001, "r_y3": 630.71014, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 651.57269, "r_x1": 179.90472, "r_y1": 651.57269, "r_x2": 179.90472, "r_y2": 642.66614, "r_x3": 50.111984, "r_y3": 642.66614, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset." }, { "label": "section_header", "id": 12, "page_no": 10, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.111984, "t": 662.39014, "r": 153.60785, "b": 672.24219, "coord_origin": "TOPLEFT" }, "confidence": 0.9515743255615234, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 672.24219, "r_x1": 64.297272, "r_y1": 672.24219, "r_x2": 64.297272, "r_y2": 662.39014, "r_x3": 50.111984, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.754135, "r_y0": 672.24219, "r_x1": 153.60785, "r_y1": 672.24219, "r_x2": 153.60785, "r_y2": 662.39014, "r_x3": 73.754135, "r_y3": 662.39014, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.2. Synthetic datasets" }, { "label": "text", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.111984, "t": 681.33113, "r": 286.36505, "b": 714.147705, "coord_origin": "TOPLEFT" }, "confidence": 0.9783332347869873, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.06698600000001, "r_y0": 690.2377, "r_x1": 286.36493, "r_y1": 690.2377, "r_x2": 286.36493, "r_y2": 681.33113, "r_x3": 62.06698600000001, "r_y3": 681.33113, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 702.1927029999999, "r_x1": 286.36505, "r_y1": 702.1927029999999, "r_x2": 286.36505, "r_y2": 693.2861330000001, "r_x3": 50.111984, "r_y3": 693.2861330000001, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.111984, "r_y0": 714.147705, "r_x1": 84.144226, "r_y1": 714.147705, "r_x2": 84.144226, "r_y2": 705.241135, "r_x3": 50.111984, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.237595, "r_y0": 714.147705, "r_x1": 286.36505, "r_y1": 714.147705, "r_x2": 286.36505, "r_y2": 705.241135, "r_x3": 91.237595, "r_y3": 705.241135, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-" }, { "label": "text", "id": 8, "page_no": 10, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.862, "t": 162.65515000000005, "r": 545.11511, "b": 207.42773, "coord_origin": "TOPLEFT" }, "confidence": 0.9596064686775208, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 171.56170999999995, "r_x1": 545.11511, "r_y1": 171.56170999999995, "r_x2": 545.11511, "r_y2": 162.65515000000005, "r_x3": 308.862, "r_y3": 162.65515000000005, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 183.51671999999996, "r_x1": 545.11511, "r_y1": 183.51671999999996, "r_x2": 545.11511, "r_y2": 174.61017000000004, "r_x3": 308.862, "r_y3": 174.61017000000004, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 195.47173999999995, "r_x1": 545.11511, "r_y1": 195.47173999999995, "r_x2": 545.11511, "r_y2": 186.56519000000003, "r_x3": 308.862, "r_y3": 186.56519000000003, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 207.42773, "r_x1": 484.07434, "r_y1": 207.42773, "r_x2": 484.07434, "r_y2": 198.52117999999996, "r_x3": 308.862, "r_y3": 198.52117999999996, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)." }, { "label": "text", "id": 15, "page_no": 10, "cluster": { "id": 15, "label": "text", "bbox": { "l": 308.862, "t": 211.23517000000004, "r": 545.11505, "b": 232.09673999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9261796474456787, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 220.14171999999996, "r_x1": 545.11505, "r_y1": 220.14171999999996, "r_x2": 545.11505, "r_y2": 211.23517000000004, "r_x3": 320.81699, "r_y3": 211.23517000000004, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 232.09673999999995, "r_x1": 448.08939, "r_y1": 232.09673999999995, "r_x2": 448.08939, "r_y2": 223.19019000000003, "r_x3": 308.862, "r_y3": 223.19019000000003, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The process of generating a synthetic dataset can be decomposed into the following steps:" }, { "label": "list_item", "id": 7, "page_no": 10, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 308.862, "t": 235.90521, "r": 545.11511, "b": 316.54279, "coord_origin": "TOPLEFT" }, "confidence": 0.9642952680587769, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 244.81177000000002, "r_x1": 328.28894, "r_y1": 244.81177000000002, "r_x2": 328.28894, "r_y2": 235.90521, "r_x3": 320.81699, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38232, "r_y0": 244.81177000000002, "r_x1": 545.11499, "r_y1": 244.81177000000002, "r_x2": 545.11499, "r_y2": 235.90521, "r_x3": 335.38232, "r_y3": 235.90521, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 256.76678000000004, "r_x1": 545.11511, "r_y1": 256.76678000000004, "r_x2": 545.11511, "r_y2": 247.86023, "r_x3": 308.862, "r_y3": 247.86023, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 268.72180000000003, "r_x1": 545.11511, "r_y1": 268.72180000000003, "r_x2": 545.11511, "r_y2": 259.81525, "r_x3": 308.862, "r_y3": 259.81525, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 280.67682, "r_x1": 393.3847, "r_y1": 280.67682, "r_x2": 393.3847, "r_y2": 271.77026, "r_x3": 308.862, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.11942, "r_y0": 280.67682, "r_x1": 545.11511, "r_y1": 280.67682, "r_x2": 545.11511, "r_y2": 271.77026, "r_x3": 400.11942, "r_y3": 271.77026, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 292.63181, "r_x1": 545.11505, "r_y1": 292.63181, "r_x2": 545.11505, "r_y2": 283.72524999999996, "r_x3": 308.862, "r_y3": 283.72524999999996, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 304.5878000000001, "r_x1": 545.11511, "r_y1": 304.5878000000001, "r_x2": 545.11511, "r_y2": 295.68124, "r_x3": 308.862, "r_y3": 295.68124, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 316.54279, "r_x1": 425.69348, "r_y1": 316.54279, "r_x2": 425.69348, "r_y2": 307.63623, "r_x3": 308.862, "r_y3": 307.63623, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)." }, { "label": "list_item", "id": 6, "page_no": 10, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.862, "t": 320.35022, "r": 545.11517, "b": 448.80865, "coord_origin": "TOPLEFT" }, "confidence": 0.9699994921684265, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 329.25677, "r_x1": 328.4949, "r_y1": 329.25677, "r_x2": 328.4949, "r_y2": 320.35022, "r_x3": 320.81699, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05423, "r_y0": 329.25677, "r_x1": 545.11499, "r_y1": 329.25677, "r_x2": 545.11499, "r_y2": 320.35022, "r_x3": 331.05423, "r_y3": 320.35022, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 341.21176, "r_x1": 545.11517, "r_y1": 341.21176, "r_x2": 545.11517, "r_y2": 332.30521000000005, "r_x3": 308.862, "r_y3": 332.30521000000005, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 353.16675, "r_x1": 545.11505, "r_y1": 353.16675, "r_x2": 545.11505, "r_y2": 344.26018999999997, "r_x3": 308.862, "r_y3": 344.26018999999997, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 365.12273999999996, "r_x1": 545.11511, "r_y1": 365.12273999999996, "r_x2": 545.11511, "r_y2": 356.21619, "r_x3": 308.862, "r_y3": 356.21619, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 377.07773, "r_x1": 545.11511, "r_y1": 377.07773, "r_x2": 545.11511, "r_y2": 368.17117, "r_x3": 308.862, "r_y3": 368.17117, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 389.03271, "r_x1": 545.11499, "r_y1": 389.03271, "r_x2": 545.11499, "r_y2": 380.12616, "r_x3": 308.862, "r_y3": 380.12616, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 400.98769999999996, "r_x1": 545.11517, "r_y1": 400.98769999999996, "r_x2": 545.11517, "r_y2": 392.08115, "r_x3": 308.862, "r_y3": 392.08115, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 412.94269, "r_x1": 545.11511, "r_y1": 412.94269, "r_x2": 545.11511, "r_y2": 404.03613000000007, "r_x3": 308.862, "r_y3": 404.03613000000007, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 424.89767, "r_x1": 545.11499, "r_y1": 424.89767, "r_x2": 545.11499, "r_y2": 415.99112, "r_x3": 308.862, "r_y3": 415.99112, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 436.85367, "r_x1": 545.11517, "r_y1": 436.85367, "r_x2": 545.11517, "r_y2": 427.94711, "r_x3": 308.862, "r_y3": 427.94711, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 448.80865, "r_x1": 345.94278, "r_y1": 448.80865, "r_x2": 345.94278, "r_y2": 439.9021, "r_x3": 308.862, "r_y3": 439.9021, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans." }, { "label": "list_item", "id": 9, "page_no": 10, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 452.61609, "r": 545.11517, "b": 497.38861, "coord_origin": "TOPLEFT" }, "confidence": 0.9568928480148315, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 461.52264, "r_x1": 328.30341, "r_y1": 461.52264, "r_x2": 328.30341, "r_y2": 452.61609, "r_x3": 320.81699, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.79889, "r_y0": 461.52264, "r_x1": 485.75772000000006, "r_y1": 461.52264, "r_x2": 485.75772000000006, "r_y2": 452.61609, "r_x3": 330.79889, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.073, "r_y0": 461.29352, "r_x1": 511.86368, "r_y1": 461.29352, "r_x2": 511.86368, "r_y2": 452.70575, "r_x3": 488.073, "r_y3": 452.70575, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86301, "r_y0": 461.52264, "r_x1": 545.10815, "r_y1": 461.52264, "r_x2": 545.10815, "r_y2": 452.61609, "r_x3": 511.86301, "r_y3": 452.61609, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 473.47763, "r_x1": 545.11505, "r_y1": 473.47763, "r_x2": 545.11505, "r_y2": 464.57108, "r_x3": 308.862, "r_y3": 464.57108, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 485.43362, "r_x1": 545.11517, "r_y1": 485.43362, "r_x2": 545.11517, "r_y2": 476.52707, "r_x3": 308.862, "r_y3": 476.52707, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 497.38861, "r_x1": 379.14816, "r_y1": 497.38861, "r_x2": 379.14816, "r_y2": 488.48206, "r_x3": 308.862, "r_y3": 488.48206, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content." }, { "label": "list_item", "id": 5, "page_no": 10, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 308.862, "t": 501.19604, "r": 545.1153, "b": 545.96858, "coord_origin": "TOPLEFT" }, "confidence": 0.9710659980773926, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 510.1026, "r_x1": 328.66177, "r_y1": 510.1026, "r_x2": 328.66177, "r_y2": 501.19604, "r_x3": 320.81699, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2767, "r_y0": 510.1026, "r_x1": 545.11493, "r_y1": 510.1026, "r_x2": 545.11493, "r_y2": 501.19604, "r_x3": 331.2767, "r_y3": 501.19604, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 522.05759, "r_x1": 545.1153, "r_y1": 522.05759, "r_x2": 545.1153, "r_y2": 513.15103, "r_x3": 308.862, "r_y3": 513.15103, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 534.01358, "r_x1": 384.29883, "r_y1": 534.01358, "r_x2": 384.29883, "r_y2": 525.10703, "r_x3": 308.862, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25272, "r_y0": 534.01358, "r_x1": 545.11511, "r_y1": 534.01358, "r_x2": 545.11511, "r_y2": 525.10703, "r_x3": 391.25272, "r_y3": 525.10703, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 545.96858, "r_x1": 496.15897000000007, "r_y1": 545.96858, "r_x2": 496.15897000000007, "r_y2": 537.06203, "r_x3": 308.862, "r_y3": 537.06203, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table." }, { "label": "list_item", "id": 4, "page_no": 10, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 308.862, "t": 549.77603, "r": 545.11517, "b": 606.50359, "coord_origin": "TOPLEFT" }, "confidence": 0.9778757095336914, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 558.68259, "r_x1": 328.28894, "r_y1": 558.68259, "r_x2": 328.28894, "r_y2": 549.77603, "r_x3": 320.81699, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.40222, "r_y0": 558.68259, "r_x1": 545.11499, "r_y1": 558.68259, "r_x2": 545.11499, "r_y2": 549.77603, "r_x3": 335.40222, "r_y3": 549.77603, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 570.63759, "r_x1": 545.11517, "r_y1": 570.63759, "r_x2": 545.11517, "r_y2": 561.73103, "r_x3": 308.862, "r_y3": 561.73103, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 582.59259, "r_x1": 545.11511, "r_y1": 582.59259, "r_x2": 545.11511, "r_y2": 573.68604, "r_x3": 308.862, "r_y3": 573.68604, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 594.54858, "r_x1": 545.11505, "r_y1": 594.54858, "r_x2": 545.11505, "r_y2": 585.64203, "r_x3": 308.862, "r_y3": 585.64203, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 606.50359, "r_x1": 341.2305, "r_y1": 606.50359, "r_x2": 341.2305, "r_y2": 597.59703, "r_x3": 308.862, "r_y3": 597.59703, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process." }, { "label": "section_header", "id": 10, "page_no": 10, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 308.862, "t": 622.2905900000001, "r": 545.10876, "b": 646.98631, "coord_origin": "TOPLEFT" }, "confidence": 0.954940915107727, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 633.03831, "r_x1": 316.76675, "r_y1": 633.03831, "r_x2": 316.76675, "r_y2": 622.2905900000001, "r_x3": 308.862, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.30643, "r_y0": 633.03831, "r_x1": 545.10876, "r_y1": 633.03831, "r_x2": 545.10876, "r_y2": 622.2905900000001, "r_x3": 327.30643, "r_y3": 622.2905900000001, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.79501, "r_y0": 646.98631, "r_x1": 357.34055, "r_y1": 646.98631, "r_x2": 357.34055, "r_y2": 636.2385899999999, "r_x3": 326.79501, "r_y3": 636.2385899999999, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Prediction post-processing for PDF documents" }, { "label": "text", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86203, "t": 657.42104, "r": 545.11517, "b": 714.148605, "coord_origin": "TOPLEFT" }, "confidence": 0.9829329252243042, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 666.3276, "r_x1": 545.11499, "r_y1": 666.3276, "r_x2": 545.11499, "r_y2": 657.42104, "r_x3": 320.81702, "r_y3": 657.42104, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 678.2826, "r_x1": 545.11511, "r_y1": 678.2826, "r_x2": 545.11511, "r_y2": 669.37604, "r_x3": 308.86203, "r_y3": 669.37604, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 690.2376, "r_x1": 545.11517, "r_y1": 690.2376, "r_x2": 545.11517, "r_y2": 681.33104, "r_x3": 308.86203, "r_y3": 681.33104, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 702.1926040000001, "r_x1": 545.11505, "r_y1": 702.1926040000001, "r_x2": 545.11505, "r_y2": 693.286041, "r_x3": 308.86203, "r_y3": 693.286041, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 714.148605, "r_x1": 371.42719, "r_y1": 714.148605, "r_x2": 371.42719, "r_y2": 705.242035, "r_x3": 308.86203, "r_y3": 705.242035, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:" } ], "headers": [ { "label": "page_footer", "id": 16, "page_no": 10, "cluster": { "id": 16, "label": "page_footer", "bbox": { "l": 292.63104, "t": 734.1330379999999, "r": 302.59363, "b": 743.0396, "coord_origin": "TOPLEFT" }, "confidence": 0.8986663222312927, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63104, "r_y0": 743.0396, "r_x1": 302.59363, "r_y1": 743.0396, "r_x2": 302.59363, "r_y2": 734.1330379999999, "r_x3": 292.63104, "r_y3": 734.1330379999999, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" } ] } }, { "page_no": 11, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39108, "r_y0": 83.25922000000003, "r_x1": 151.94641, "r_y1": 83.25922000000003, "r_x2": 151.94641, "r_y2": 77.31055000000003, "r_x3": 119.39108, "r_y3": 77.31055000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.345978, "r_y0": 81.14020000000005, "r_x1": 59.327053, "r_y1": 81.14020000000005, "r_x2": 59.327053, "r_y2": 75.19152999999994, "r_x3": 53.345978, "r_y3": 75.19152999999994, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.5791, "r_y0": 83.40698000000009, "r_x1": 319.8266, "r_y1": 83.40698000000009, "r_x2": 319.8266, "r_y2": 77.45830999999998, "r_x3": 289.5791, "r_y3": 77.45830999999998, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37271, "r_y0": 83.20263999999997, "r_x1": 481.75916, "r_y1": 83.20263999999997, "r_x2": 481.75916, "r_y2": 77.25396999999987, "r_x3": 448.37271, "r_y3": 77.25396999999987, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.553436, "r_y0": 146.23339999999996, "r_x1": 94.976013, "r_y1": 146.23339999999996, "r_x2": 94.976013, "r_y2": 141.27617999999995, "r_x3": 82.553436, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.03878399999999, "r_y0": 106.06133999999986, "r_x1": 85.290085, "r_y1": 106.06133999999986, "r_x2": 85.290085, "r_y2": 101.10413000000005, "r_x3": 63.03878399999999, "r_y3": 101.10413000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.76786, "r_y0": 129.35253999999998, "r_x1": 85.231277, "r_y1": 129.35253999999998, "r_x2": 85.231277, "r_y2": 124.39531999999997, "r_x3": 67.76786, "r_y3": 124.39531999999997, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55121, "r_y0": 107.49712999999997, "r_x1": 249.80251, "r_y1": 107.49712999999997, "r_x2": 249.80251, "r_y2": 102.53992000000005, "r_x3": 227.55121, "r_y3": 102.53992000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.19898999999998, "r_y0": 131.94299, "r_x1": 249.66241, "r_y1": 131.94299, "r_x2": 249.66241, "r_y2": 126.98577999999986, "r_x3": 232.19898999999998, "r_y3": 126.98577999999986, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2337, "r_y0": 119.00243999999998, "r_x1": 413.69711, "r_y1": 119.00243999999998, "r_x2": 413.69711, "r_y2": 114.04522999999995, "r_x3": 396.2337, "r_y3": 114.04522999999995, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.382202, "r_y0": 146.23339999999996, "r_x1": 105.08014, "r_y1": 146.23339999999996, "r_x2": 105.08014, "r_y2": 141.27617999999995, "r_x3": 97.382202, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.93763400000001, "r_y0": 90.69042999999999, "r_x1": 76.151443, "r_y1": 90.69042999999999, "r_x2": 76.151443, "r_y2": 85.73321999999996, "r_x3": 60.93763400000001, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.304901, "r_y0": 91.18073000000015, "r_x1": 106.99162, "r_y1": 91.18073000000015, "r_x2": 106.99162, "r_y2": 86.22351000000003, "r_x3": 82.304901, "r_y3": 86.22351000000003, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.20530999999997, "r_y0": 146.56329000000005, "r_x1": 281.88013, "r_y1": 146.56329000000005, "r_x2": 281.88013, "r_y2": 141.60608000000002, "r_x3": 246.20530999999997, "r_y3": 141.60608000000002, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.69780000000003, "r_y0": 90.69042999999999, "r_x1": 241.91161, "r_y1": 90.69042999999999, "r_x2": 241.91161, "r_y2": 85.73321999999996, "r_x3": 226.69780000000003, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.93848999999997, "r_y0": 91.04522999999995, "r_x1": 282.49384, "r_y1": 91.04522999999995, "r_x2": 282.49384, "r_y2": 86.08801000000005, "r_x3": 249.93848999999997, "r_y3": 86.08801000000005, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19409, "r_y0": 146.23339999999996, "r_x1": 444.68915, "r_y1": 146.23339999999996, "r_x2": 444.68915, "r_y2": 141.27617999999995, "r_x3": 410.19409, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37341, "r_y0": 90.69042999999999, "r_x1": 432.6716599999999, "r_y1": 90.69042999999999, "r_x2": 432.6716599999999, "r_y2": 85.73321999999996, "r_x3": 391.37341, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.60571000000004, "r_y0": 91.21862999999996, "r_x1": 445.62414999999993, "r_y1": 91.21862999999996, "r_x2": 445.62414999999993, "r_y2": 86.26140999999996, "r_x3": 435.60571000000004, "r_y3": 86.26140999999996, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.94921, "r_y0": 146.24567000000002, "r_x1": 136.20052, "r_y1": 146.24567000000002, "r_x2": 136.20052, "r_y2": 141.28845, "r_x3": 113.94921, "r_y3": 141.28845, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.91554000000001, "r_y0": 99.77575999999999, "r_x1": 127.05433999999998, "r_y1": 99.77575999999999, "r_x2": 127.05433999999998, "r_y2": 94.81853999999998, "r_x3": 116.91554000000001, "r_y3": 94.81853999999998, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.3146, "r_y0": 105.89575000000002, "r_x1": 127.05298, "r_y1": 105.89575000000002, "r_x2": 127.05298, "r_y2": 100.93853999999999, "r_x3": 113.3146, "r_y3": 100.93853999999999, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94112, "r_y0": 112.01575000000003, "r_x1": 127.05537, "r_y1": 112.01575000000003, "r_x2": 127.05537, "r_y2": 107.05853000000013, "r_x3": 112.94112, "r_y3": 107.05853000000013, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.22738999999999, "r_y0": 127.57245, "r_x1": 126.96577, "r_y1": 127.57245, "r_x2": 126.96577, "r_y2": 122.61523, "r_x3": 113.22738999999999, "r_y3": 122.61523, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85390000000001, "r_y0": 133.69244000000003, "r_x1": 126.96814999999998, "r_y1": 133.69244000000003, "r_x2": 126.96814999999998, "r_y2": 128.73523, "r_x3": 112.85390000000001, "r_y3": 128.73523, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.57864, "r_y0": 146.39362000000006, "r_x1": 156.04207, "r_y1": 146.39362000000006, "r_x2": 156.04207, "r_y2": 141.43640000000005, "r_x3": 138.57864, "r_y3": 141.43640000000005, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03101, "r_y0": 91.22852, "r_x1": 151.04185, "r_y1": 91.22852, "r_x2": 151.04185, "r_y2": 86.2713, "r_x3": 122.03101, "r_y3": 86.2713, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65359, "r_y0": 91.5122100000001, "r_x1": 321.67203, "r_y1": 91.5122100000001, "r_x2": 321.67203, "r_y2": 86.55498999999998, "r_x3": 311.65359, "r_y3": 86.55498999999998, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89441, "r_y0": 146.66785000000004, "r_x1": 310.14572, "r_y1": 146.66785000000004, "r_x2": 310.14572, "r_y2": 141.71063000000004, "r_x3": 287.89441, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.23572, "r_y0": 98.03698999999995, "r_x1": 299.37451, "r_y1": 98.03698999999995, "r_x2": 299.37451, "r_y2": 93.07977000000005, "r_x3": 289.23572, "r_y3": 93.07977000000005, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63513, "r_y0": 104.15698000000009, "r_x1": 299.3735, "r_y1": 104.15698000000009, "r_x2": 299.3735, "r_y2": 99.19976999999994, "r_x3": 285.63513, "r_y3": 99.19976999999994, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26111, "r_y0": 110.27697999999998, "r_x1": 299.37537, "r_y1": 110.27697999999998, "r_x2": 299.37537, "r_y2": 105.31975999999997, "r_x3": 285.26111, "r_y3": 105.31975999999997, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43109, "r_y0": 125.34717, "r_x1": 299.16946, "r_y1": 125.34717, "r_x2": 299.16946, "r_y2": 120.38995, "r_x3": 285.43109, "r_y3": 120.38995, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.05713, "r_y0": 131.46716000000004, "r_x1": 299.17139, "r_y1": 131.46716000000004, "r_x2": 299.17139, "r_y2": 126.50995, "r_x3": 285.05713, "r_y3": 126.50995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.34592, "r_y0": 146.66785000000004, "r_x1": 328.80933, "r_y1": 146.66785000000004, "r_x2": 328.80933, "r_y2": 141.71063000000004, "r_x3": 311.34592, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58362, "r_y0": 91.65075999999999, "r_x1": 309.60205, "r_y1": 91.65075999999999, "r_x2": 309.60205, "r_y2": 86.69353999999998, "r_x3": 299.58362, "r_y3": 86.69353999999998, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04077000000007, "r_y0": 146.62891000000002, "r_x1": 483.50418, "r_y1": 146.62891000000002, "r_x2": 483.50418, "r_y2": 141.67169, "r_x3": 466.04077000000007, "r_y3": 141.67169, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02151, "r_y0": 98.71838000000002, "r_x1": 469.16031000000004, "r_y1": 98.71838000000002, "r_x2": 469.16031000000004, "r_y2": 93.76116999999999, "r_x3": 459.02151, "r_y3": 93.76116999999999, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.4209, "r_y0": 104.83838000000003, "r_x1": 469.15927000000005, "r_y1": 104.83838000000003, "r_x2": 469.15927000000005, "r_y2": 99.88116000000002, "r_x3": 455.4209, "r_y3": 99.88116000000002, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.04691, "r_y0": 110.95836999999995, "r_x1": 469.16115999999994, "r_y1": 110.95836999999995, "r_x2": 469.16115999999994, "r_y2": 106.00116000000014, "r_x3": 455.04691, "r_y3": 106.00116000000014, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39401, "r_y0": 90.52959999999996, "r_x1": 480.6545100000001, "r_y1": 90.52959999999996, "r_x2": 480.6545100000001, "r_y2": 85.57239000000004, "r_x3": 467.39401, "r_y3": 85.57239000000004, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37672, "r_y0": 146.54107999999997, "r_x1": 182.62802, "r_y1": 146.54107999999997, "r_x2": 182.62802, "r_y2": 141.58385999999996, "r_x3": 160.37672, "r_y3": 141.58385999999996, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74265, "r_y0": 99.82201999999995, "r_x1": 173.32664, "r_y1": 99.82201999999995, "r_x2": 173.32664, "r_y2": 94.86481000000003, "r_x3": 153.74265, "r_y3": 94.86481000000003, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50967, "r_y0": 105.94202000000007, "r_x1": 173.3246, "r_y1": 105.94202000000007, "r_x2": 173.3246, "r_y2": 100.98479999999995, "r_x3": 154.50967, "r_y3": 100.98479999999995, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27162, "r_y0": 112.06200999999987, "r_x1": 173.32664, "r_y1": 112.06200999999987, "r_x2": 173.32664, "r_y2": 107.10479999999995, "r_x3": 155.27162, "r_y3": 107.10479999999995, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41302, "r_y0": 112.18970000000002, "r_x1": 345.99701, "r_y1": 112.18970000000002, "r_x2": 345.99701, "r_y2": 107.23248000000001, "r_x3": 326.41302, "r_y3": 107.23248000000001, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.17972, "r_y0": 118.30969000000005, "r_x1": 345.99463, "r_y1": 118.30969000000005, "r_x2": 345.99463, "r_y2": 113.35248000000001, "r_x3": 327.17972, "r_y3": 113.35248000000001, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94131, "r_y0": 124.42969000000005, "r_x1": 345.99634, "r_y1": 124.42969000000005, "r_x2": 345.99634, "r_y2": 119.47247000000004, "r_x3": 327.94131, "r_y3": 119.47247000000004, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.9942, "r_y0": 109.11095999999998, "r_x1": 508.76384999999993, "r_y1": 109.11095999999998, "r_x2": 508.76384999999993, "r_y2": 104.15374999999983, "r_x3": 488.9942, "r_y3": 104.15374999999983, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.1893, "r_y0": 115.2309600000001, "r_x1": 508.76349000000005, "r_y1": 115.2309600000001, "r_x2": 508.76349000000005, "r_y2": 110.27373999999998, "r_x3": 490.1893, "r_y3": 110.27373999999998, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72009, "r_y0": 121.35095000000013, "r_x1": 508.76758, "r_y1": 121.35095000000013, "r_x2": 508.76758, "r_y2": 116.39373999999998, "r_x3": 489.72009, "r_y3": 116.39373999999998, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71121, "r_y0": 127.47095000000002, "r_x1": 508.76624, "r_y1": 127.47095000000002, "r_x2": 508.76624, "r_y2": 122.51373000000001, "r_x3": 490.71121, "r_y3": 122.51373000000001, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.37759, "r_y0": 146.66840000000002, "r_x1": 202.84102, "r_y1": 146.66840000000002, "r_x2": 202.84102, "r_y2": 141.71118, "r_x3": 185.37759, "r_y3": 141.71118, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.50357, "r_y0": 91.09331999999995, "r_x1": 197.52699, "r_y1": 91.09331999999995, "r_x2": 197.52699, "r_y2": 86.13611000000003, "r_x3": 168.50357, "r_y3": 86.13611000000003, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.3768, "r_y0": 90.95428000000004, "r_x1": 367.39523, "r_y1": 90.95428000000004, "r_x2": 367.39523, "r_y2": 85.99707000000001, "r_x3": 357.3768, "r_y3": 85.99707000000001, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73151, "r_y0": 146.58043999999995, "r_x1": 374.92862, "r_y1": 146.58043999999995, "r_x2": 374.92862, "r_y2": 141.62323000000004, "r_x3": 333.73151, "r_y3": 141.62323000000004, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69101, "r_y0": 91.01312000000007, "r_x1": 355.70944, "r_y1": 91.01312000000007, "r_x2": 355.70944, "r_y2": 86.05591000000004, "r_x3": 345.69101, "r_y3": 86.05591000000004, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54248, "r_y0": 146.33405000000005, "r_x1": 526.00592, "r_y1": 146.33405000000005, "r_x2": 526.00592, "r_y2": 141.37683000000004, "r_x3": 508.54248, "r_y3": 141.37683000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.44653000000005, "r_y0": 91.0498, "r_x1": 523.70703, "r_y1": 91.0498, "r_x2": 523.70703, "r_y2": 86.09258999999986, "r_x3": 510.44653000000005, "r_y3": 86.09258999999986, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 174.40894000000003, "r_x1": 545.11371, "r_y1": 174.40894000000003, "r_x2": 545.11371, "r_y2": 165.50238000000002, "r_x3": 50.112, "r_y3": 165.50238000000002, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 186.36395000000005, "r_x1": 513.52234, "r_y1": 186.36395000000005, "r_x2": 513.52234, "r_y2": 177.4574, "r_x3": 50.112, "r_y3": 177.4574, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 219.83794999999998, "r_x1": 71.14743, "r_y1": 219.83794999999998, "r_x2": 71.14743, "r_y2": 210.93140000000005, "r_x3": 61.569, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.542038, "r_y0": 219.83794999999998, "r_x1": 286.36511, "r_y1": 219.83794999999998, "r_x2": 286.36511, "r_y2": 210.93140000000005, "r_x3": 73.542038, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 231.79296999999997, "r_x1": 87.47155, "r_y1": 231.79296999999997, "r_x2": 87.47155, "r_y2": 222.88640999999996, "r_x3": 70.037003, "r_y3": 222.88640999999996, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 252.97797000000003, "r_x1": 71.345718, "r_y1": 252.97797000000003, "r_x2": 71.345718, "r_y2": 244.07141000000001, "r_x3": 61.569, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.789902, "r_y0": 252.97797000000003, "r_x1": 286.36514, "r_y1": 252.97797000000003, "r_x2": 286.36514, "r_y2": 244.07141000000001, "r_x3": 73.789902, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 264.93298000000004, "r_x1": 150.41524, "r_y1": 264.93298000000004, "r_x2": 150.41524, "r_y2": 256.02643, "r_x3": 70.037003, "r_y3": 256.02643, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 288.10999, "r_x1": 286.36499, "r_y1": 288.10999, "r_x2": 286.36499, "r_y2": 279.20343, "r_x3": 62.067001, "r_y3": 279.20343, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.06497, "r_x1": 286.36505, "r_y1": 300.06497, "r_x2": 286.36505, "r_y2": 291.15842, "r_x3": 50.112, "r_y3": 291.15842, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.01996, "r_x1": 286.36511, "r_y1": 312.01996, "r_x2": 286.36511, "r_y2": 303.1134, "r_x3": 50.112, "r_y3": 303.1134, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 323.97495, "r_x1": 286.36511, "r_y1": 323.97495, "r_x2": 286.36511, "r_y2": 315.06839, "r_x3": 50.112, "r_y3": 315.06839, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 335.93093999999996, "r_x1": 286.36511, "r_y1": 335.93093999999996, "r_x2": 286.36511, "r_y2": 327.02438, "r_x3": 50.112, "r_y3": 327.02438, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 347.88593, "r_x1": 286.36505, "r_y1": 347.88593, "r_x2": 286.36505, "r_y2": 338.97937, "r_x3": 50.112, "r_y3": 338.97937, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.84091, "r_x1": 286.36508, "r_y1": 359.84091, "r_x2": 286.36508, "r_y2": 350.93436, "r_x3": 50.112, "r_y3": 350.93436, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.7959, "r_x1": 286.36511, "r_y1": 371.7959, "r_x2": 286.36511, "r_y2": 362.88934, "r_x3": 50.112, "r_y3": 362.88934, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 383.75089, "r_x1": 286.36508, "r_y1": 383.75089, "r_x2": 286.36508, "r_y2": 374.84433000000007, "r_x3": 50.112, "r_y3": 374.84433000000007, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 395.70688, "r_x1": 154.55988, "r_y1": 395.70688, "r_x2": 154.55988, "r_y2": 386.80032, "r_x3": 50.112, "r_y3": 386.80032, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 407.97589, "r_x1": 286.36496, "r_y1": 407.97589, "r_x2": 286.36496, "r_y2": 399.06934, "r_x3": 62.067001, "r_y3": 399.06934, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 419.93188, "r_x1": 95.491638, "r_y1": 419.93188, "r_x2": 95.491638, "r_y2": 411.02533, "r_x3": 50.112, "r_y3": 411.02533, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 432.20187, "r_x1": 69.37281, "r_y1": 432.20187, "r_x2": 69.37281, "r_y2": 423.29532, "r_x3": 62.067001, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.808075, "r_y0": 432.20187, "r_x1": 286.36502, "r_y1": 432.20187, "r_x2": 286.36502, "r_y2": 423.29532, "r_x3": 71.808075, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 444.15686, "r_x1": 286.36508, "r_y1": 444.15686, "r_x2": 286.36508, "r_y2": 435.25031, "r_x3": 50.112, "r_y3": 435.25031, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 456.11185000000006, "r_x1": 274.50958, "r_y1": 456.11185000000006, "r_x2": 274.50958, "r_y2": 447.20529, "r_x3": 50.112, "r_y3": 447.20529, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 468.38184, "r_x1": 69.538948, "r_y1": 468.38184, "r_x2": 69.538948, "r_y2": 459.47528, "r_x3": 62.067001, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.429329, "r_y0": 468.38184, "r_x1": 286.36499, "r_y1": 468.38184, "r_x2": 286.36499, "r_y2": 459.47528, "r_x3": 77.429329, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 480.33682, "r_x1": 286.36505, "r_y1": 480.33682, "r_x2": 286.36505, "r_y2": 471.43027, "r_x3": 50.112, "r_y3": 471.43027, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.29181, "r_x1": 286.36505, "r_y1": 492.29181, "r_x2": 286.36505, "r_y2": 483.38525, "r_x3": 50.112, "r_y3": 483.38525, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 504.2468, "r_x1": 110.70452999999999, "r_y1": 504.2468, "r_x2": 110.70452999999999, "r_y2": 495.34024, "r_x3": 50.112, "r_y3": 495.34024, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 516.5167799999999, "r_x1": 69.863068, "r_y1": 516.5167799999999, "r_x2": 69.863068, "r_y2": 507.61023, "r_x3": 62.067001, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.461754, "r_y0": 516.5167799999999, "r_x1": 286.36493, "r_y1": 516.5167799999999, "r_x2": 286.36493, "r_y2": 507.61023, "r_x3": 72.461754, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 528.4727800000001, "r_x1": 226.0714, "r_y1": 528.4727800000001, "r_x2": 226.0714, "r_y2": 519.5662199999999, "r_x3": 50.112, "r_y3": 519.5662199999999, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 540.7417800000001, "r_x1": 286.36496, "r_y1": 540.7417800000001, "r_x2": 286.36496, "r_y2": 531.83521, "r_x3": 62.067001, "r_y3": 531.83521, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 552.69777, "r_x1": 286.36511, "r_y1": 552.69777, "r_x2": 286.36511, "r_y2": 543.79121, "r_x3": 50.112, "r_y3": 543.79121, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 564.65277, "r_x1": 114.03204, "r_y1": 564.65277, "r_x2": 114.03204, "r_y2": 555.74622, "r_x3": 50.112, "r_y3": 555.74622, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 576.92278, "r_x1": 69.538948, "r_y1": 576.92278, "r_x2": 69.538948, "r_y2": 568.01622, "r_x3": 62.067001, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.731949, "r_y0": 576.92278, "r_x1": 286.36502, "r_y1": 576.92278, "r_x2": 286.36502, "r_y2": 568.01622, "r_x3": 76.731949, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 588.87778, "r_x1": 286.36508, "r_y1": 588.87778, "r_x2": 286.36508, "r_y2": 579.97122, "r_x3": 50.112, "r_y3": 579.97122, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 600.83278, "r_x1": 278.70383, "r_y1": 600.83278, "r_x2": 278.70383, "r_y2": 591.9262200000001, "r_x3": 50.112, "r_y3": 591.9262200000001, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.02799999999999, "r_y0": 632.84061, "r_x1": 157.9516, "r_y1": 632.84061, "r_x2": 157.9516, "r_y2": 623.99382, "r_x3": 112.02799999999999, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.715, "r_y0": 632.84061, "r_x1": 203.4964, "r_y1": 632.84061, "r_x2": 203.4964, "r_y2": 623.99382, "r_x3": 160.715, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58499, "r_y0": 640.17578, "r_x1": 189.14511, "r_y1": 640.17578, "r_x2": 189.14511, "r_y2": 633.98305, "r_x3": 185.58499, "r_y3": 633.98305, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.49899, "r_y0": 632.84061, "r_x1": 208.48029, "r_y1": 632.84061, "r_x2": 208.48029, "r_y2": 623.43591, "r_x3": 203.49899, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48099, "r_y0": 632.84061, "r_x1": 220.28911, "r_y1": 632.84061, "r_x2": 220.28911, "r_y2": 623.99382, "r_x3": 208.48099, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.78699, "r_y0": 632.84061, "r_x1": 225.76828, "r_y1": 632.84061, "r_x2": 225.76828, "r_y2": 623.43591, "r_x3": 220.78699, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.70499, "r_y0": 654.1056100000001, "r_x1": 122.51310999999998, "r_y1": 654.1056100000001, "r_x2": 122.51310999999998, "r_y2": 645.25882, "r_x3": 110.70499, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.77899000000001, "r_y0": 654.1056100000001, "r_x1": 133.52791, "r_y1": 654.1056100000001, "r_x2": 133.52791, "r_y2": 645.25882, "r_x3": 125.77899000000001, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.295, "r_y0": 654.1056100000001, "r_x1": 156.00201, "r_y1": 654.1056100000001, "r_x2": 156.00201, "r_y2": 645.25882, "r_x3": 136.295, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.00299, "r_y0": 654.1056100000001, "r_x1": 160.98428, "r_y1": 654.1056100000001, "r_x2": 160.98428, "r_y2": 644.70091, "r_x3": 156.00299, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98399, "r_y0": 654.1056100000001, "r_x1": 170.23811, "r_y1": 654.1056100000001, "r_x2": 170.23811, "r_y2": 645.25882, "r_x3": 160.98399, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.73599, "r_y0": 654.1056100000001, "r_x1": 185.6779, "r_y1": 654.1056100000001, "r_x2": 185.6779, "r_y2": 644.70091, "r_x3": 170.73599, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.894, "r_y0": 654.1056100000001, "r_x1": 206.05283, "r_y1": 654.1056100000001, "r_x2": 206.05283, "r_y2": 645.25882, "r_x3": 187.894, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.054, "r_y0": 654.1056100000001, "r_x1": 211.03529, "r_y1": 654.1056100000001, "r_x2": 211.03529, "r_y2": 644.70091, "r_x3": 206.054, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.035, "r_y0": 654.1056100000001, "r_x1": 220.28912, "r_y1": 654.1056100000001, "r_x2": 220.28912, "r_y2": 645.25882, "r_x3": 211.035, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.787, "r_y0": 654.1056100000001, "r_x1": 225.76829999999998, "r_y1": 654.1056100000001, "r_x2": 225.76829999999998, "r_y2": 644.70091, "r_x3": 220.787, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 643.79178, "r_x1": 286.3624, "r_y1": 643.79178, "r_x2": 286.3624, "r_y2": 634.88522, "r_x3": 274.746, "r_y3": 634.88522, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 676.97179, "r_x1": 74.45063, "r_y1": 676.97179, "r_x2": 74.45063, "r_y2": 668.06522, "r_x3": 50.112, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.335999, "r_y0": 676.75261, "r_x1": 82.647812, "r_y1": 676.75261, "r_x2": 82.647812, "r_y2": 667.90582, "r_x3": 78.335999, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.532997, "r_y0": 676.97179, "r_x1": 123.63372, "r_y1": 676.97179, "r_x2": 123.63372, "r_y2": 668.06522, "r_x3": 86.532997, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.51899999999999, "r_y0": 676.75261, "r_x1": 132.50029, "r_y1": 676.75261, "r_x2": 132.50029, "r_y2": 667.3479199999999, "r_x3": 127.51899999999999, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.50099, "r_y0": 676.97179, "r_x1": 210.69743, "r_y1": 676.97179, "r_x2": 210.69743, "r_y2": 668.06522, "r_x3": 132.50099, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.69699, "r_y0": 676.75261, "r_x1": 215.67828, "r_y1": 676.75261, "r_x2": 215.67828, "r_y2": 667.3479199999999, "r_x3": 210.69699, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56299, "r_y0": 676.97179, "r_x1": 233.94897000000003, "r_y1": 676.97179, "r_x2": 233.94897000000003, "r_y2": 668.06522, "r_x3": 219.56299, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83499000000003, "r_y0": 676.75261, "r_x1": 247.08911, "r_y1": 676.75261, "r_x2": 247.08911, "r_y2": 667.90582, "r_x3": 237.83499000000003, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47299000000004, "r_y0": 676.97179, "r_x1": 286.362, "r_y1": 676.97179, "r_x2": 286.362, "r_y2": 668.06522, "r_x3": 251.47299000000004, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 688.92679, "r_x1": 205.88721, "r_y1": 688.92679, "r_x2": 205.88721, "r_y2": 680.02022, "r_x3": 50.112, "r_y3": 680.02022, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 701.196785, "r_x1": 69.538948, "r_y1": 701.196785, "r_x2": 69.538948, "r_y2": 692.290222, "r_x3": 62.067001, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.273666, "r_y0": 701.196785, "r_x1": 286.36496, "r_y1": 701.196785, "r_x2": 286.36496, "r_y2": 692.290222, "r_x3": 76.273666, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.151787, "r_x1": 94.604973, "r_y1": 713.151787, "r_x2": 94.604973, "r_y2": 704.245224, "r_x3": 50.112, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.598999, "r_y0": 712.93261, "r_x1": 103.29263, "r_y1": 712.93261, "r_x2": 103.29263, "r_y2": 704.085815, "r_x3": 97.598999, "r_y3": 704.085815, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.292, "r_y0": 713.151787, "r_x1": 286.36481, "r_y1": 713.151787, "r_x2": 286.36481, "r_y2": 704.245224, "r_x3": 103.292, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 219.83776999999998, "r_x1": 545.11517, "r_y1": 219.83776999999998, "r_x2": 545.11517, "r_y2": 210.93120999999996, "r_x3": 308.862, "r_y3": 210.93120999999996, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 231.79376000000002, "r_x1": 545.11511, "r_y1": 231.79376000000002, "r_x2": 545.11511, "r_y2": 222.88720999999998, "r_x3": 308.862, "r_y3": 222.88720999999998, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 243.74878, "r_x1": 545.11511, "r_y1": 243.74878, "r_x2": 545.11511, "r_y2": 234.84222, "r_x3": 308.862, "r_y3": 234.84222, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 255.7038, "r_x1": 339.57669, "r_y1": 255.7038, "r_x2": 339.57669, "r_y2": 246.79724, "r_x3": 308.862, "r_y3": 246.79724, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 268.00879, "r_x1": 328.28894, "r_y1": 268.00879, "r_x2": 328.28894, "r_y2": 259.10222999999996, "r_x3": 320.81699, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88419, "r_y0": 268.00879, "r_x1": 545.11499, "r_y1": 268.00879, "r_x2": 545.11499, "r_y2": 259.10222999999996, "r_x3": 334.88419, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 279.96380999999997, "r_x1": 338.19189, "r_y1": 279.96380999999997, "r_x2": 338.19189, "r_y2": 271.05724999999995, "r_x3": 308.862, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68201, "r_y0": 279.74463000000003, "r_x1": 346.37564, "r_y1": 279.74463000000003, "r_x2": 346.37564, "r_y2": 270.89783, "r_x3": 340.68201, "r_y3": 270.89783, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37601, "r_y0": 279.96380999999997, "r_x1": 453.72305000000006, "r_y1": 279.96380999999997, "r_x2": 453.72305000000006, "r_y2": 271.05724999999995, "r_x3": 346.37601, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 292.26981, "r_x1": 328.38953, "r_y1": 292.26981, "r_x2": 328.38953, "r_y2": 283.36325000000005, "r_x3": 320.81702, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.9137, "r_y0": 292.26981, "r_x1": 545.11499, "r_y1": 292.26981, "r_x2": 545.11499, "r_y2": 283.36325000000005, "r_x3": 330.9137, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 304.22479, "r_x1": 545.11511, "r_y1": 304.22479, "r_x2": 545.11511, "r_y2": 295.31824, "r_x3": 308.86203, "r_y3": 295.31824, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 316.17978, "r_x1": 545.11505, "r_y1": 316.17978, "r_x2": 545.11505, "r_y2": 307.27322, "r_x3": 308.86203, "r_y3": 307.27322, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 328.13477, "r_x1": 545.11511, "r_y1": 328.13477, "r_x2": 545.11511, "r_y2": 319.22821000000005, "r_x3": 308.86203, "r_y3": 319.22821000000005, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 340.09076000000005, "r_x1": 397.19043, "r_y1": 340.09076000000005, "r_x2": 397.19043, "r_y2": 331.1842, "r_x3": 308.86203, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.65616, "r_y0": 340.09076000000005, "r_x1": 545.11511, "r_y1": 340.09076000000005, "r_x2": 545.11511, "r_y2": 331.1842, "r_x3": 403.65616, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 352.04575, "r_x1": 545.11511, "r_y1": 352.04575, "r_x2": 545.11511, "r_y2": 343.13919, "r_x3": 308.86203, "r_y3": 343.13919, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 364.00073, "r_x1": 545.11505, "r_y1": 364.00073, "r_x2": 545.11505, "r_y2": 355.09418, "r_x3": 308.86203, "r_y3": 355.09418, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 375.95572000000004, "r_x1": 545.11505, "r_y1": 375.95572000000004, "r_x2": 545.11505, "r_y2": 367.04916, "r_x3": 308.86203, "r_y3": 367.04916, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 387.91071, "r_x1": 329.61414, "r_y1": 387.91071, "r_x2": 329.61414, "r_y2": 379.00415, "r_x3": 308.86203, "r_y3": 379.00415, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 400.2167099999999, "r_x1": 328.55356, "r_y1": 400.2167099999999, "r_x2": 328.55356, "r_y2": 391.31015, "r_x3": 320.81702, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13242, "r_y0": 400.2167099999999, "r_x1": 545.11505, "r_y1": 400.2167099999999, "r_x2": 545.11505, "r_y2": 391.31015, "r_x3": 331.13242, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 412.17169, "r_x1": 545.11517, "r_y1": 412.17169, "r_x2": 545.11517, "r_y2": 403.26514, "r_x3": 308.86203, "r_y3": 403.26514, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 424.12668, "r_x1": 545.11511, "r_y1": 424.12668, "r_x2": 545.11511, "r_y2": 415.22012000000007, "r_x3": 308.86203, "r_y3": 415.22012000000007, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 436.0816699999999, "r_x1": 545.11511, "r_y1": 436.0816699999999, "r_x2": 545.11511, "r_y2": 427.17511, "r_x3": 308.86203, "r_y3": 427.17511, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 448.03665, "r_x1": 545.11505, "r_y1": 448.03665, "r_x2": 545.11505, "r_y2": 439.1301, "r_x3": 308.86203, "r_y3": 439.1301, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 459.99164, "r_x1": 426.18161, "r_y1": 459.99164, "r_x2": 426.18161, "r_y2": 451.08507999999995, "r_x3": 308.86203, "r_y3": 451.08507999999995, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 472.29764, "r_x1": 328.67316, "r_y1": 472.29764, "r_x2": 328.67316, "r_y2": 463.39108, "r_x3": 320.81702, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29187, "r_y0": 472.29764, "r_x1": 545.11499, "r_y1": 472.29764, "r_x2": 545.11499, "r_y2": 463.39108, "r_x3": 331.29187, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 484.25262, "r_x1": 545.11505, "r_y1": 484.25262, "r_x2": 545.11505, "r_y2": 475.34607, "r_x3": 308.86203, "r_y3": 475.34607, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 496.20761, "r_x1": 545.11517, "r_y1": 496.20761, "r_x2": 545.11517, "r_y2": 487.30106, "r_x3": 308.86203, "r_y3": 487.30106, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 508.1626, "r_x1": 381.89786, "r_y1": 508.1626, "r_x2": 381.89786, "r_y2": 499.25604, "r_x3": 308.86203, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7023, "r_y0": 508.1626, "r_x1": 545.11517, "r_y1": 508.1626, "r_x2": 545.11517, "r_y2": 499.25604, "r_x3": 388.7023, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 520.11859, "r_x1": 545.11511, "r_y1": 520.11859, "r_x2": 545.11511, "r_y2": 511.21204, "r_x3": 308.86203, "r_y3": 511.21204, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 532.07358, "r_x1": 545.11505, "r_y1": 532.07358, "r_x2": 545.11505, "r_y2": 523.16702, "r_x3": 308.86203, "r_y3": 523.16702, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 544.02858, "r_x1": 545.11499, "r_y1": 544.02858, "r_x2": 545.11499, "r_y2": 535.12201, "r_x3": 308.86203, "r_y3": 535.12201, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 555.98358, "r_x1": 545.11517, "r_y1": 555.98358, "r_x2": 545.11517, "r_y2": 547.07703, "r_x3": 308.86203, "r_y3": 547.07703, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 567.93858, "r_x1": 442.22147000000007, "r_y1": 567.93858, "r_x2": 442.22147000000007, "r_y2": 559.03203, "r_x3": 308.86203, "r_y3": 559.03203, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 580.24458, "r_x1": 545.11493, "r_y1": 580.24458, "r_x2": 545.11493, "r_y2": 571.33803, "r_x3": 320.81702, "r_y3": 571.33803, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 592.19958, "r_x1": 471.64093, "r_y1": 592.19958, "r_x2": 471.64093, "r_y2": 583.29303, "r_x3": 308.86203, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83405, "r_y0": 591.98041, "r_x1": 479.71872, "r_y1": 591.98041, "r_x2": 479.71872, "r_y2": 583.1336200000001, "r_x3": 474.83405, "r_y3": 583.1336200000001, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.26903999999996, "r_y0": 592.19958, "r_x1": 545.11688, "r_y1": 592.19958, "r_x2": 545.11688, "r_y2": 583.29303, "r_x3": 483.26903999999996, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 604.15459, "r_x1": 329.91306, "r_y1": 604.15459, "r_x2": 329.91306, "r_y2": 595.24803, "r_x3": 308.86206, "r_y3": 595.24803, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 616.4595899999999, "r_x1": 332.8718, "r_y1": 616.4595899999999, "r_x2": 332.8718, "r_y2": 607.55304, "r_x3": 320.81705, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.92532, "r_y0": 616.4595899999999, "r_x1": 545.11505, "r_y1": 616.4595899999999, "r_x2": 545.11505, "r_y2": 607.55304, "r_x3": 339.92532, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 628.4155900000001, "r_x1": 495.2923, "r_y1": 628.4155900000001, "r_x2": 495.2923, "r_y2": 619.50903, "r_x3": 308.86206, "r_y3": 619.50903, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 640.72058, "r_x1": 545.11505, "r_y1": 640.72058, "r_x2": 545.11505, "r_y2": 631.81403, "r_x3": 320.81705, "r_y3": 631.81403, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 652.67558, "r_x1": 455.28238, "r_y1": 652.67558, "r_x2": 455.28238, "r_y2": 643.7690299999999, "r_x3": 308.86206, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.77704, "r_y0": 652.45641, "r_x1": 463.47067, "r_y1": 652.45641, "r_x2": 463.47067, "r_y2": 643.60962, "r_x3": 457.77704, "r_y3": 643.60962, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97104, "r_y0": 652.67558, "r_x1": 545.11389, "r_y1": 652.67558, "r_x2": 545.11389, "r_y2": 643.7690299999999, "r_x3": 465.97104, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 664.63059, "r_x1": 332.38376, "r_y1": 664.63059, "r_x2": 332.38376, "r_y2": 655.72403, "r_x3": 308.86206, "r_y3": 655.72403, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 676.93659, "r_x1": 545.11499, "r_y1": 676.93659, "r_x2": 545.11499, "r_y2": 668.03003, "r_x3": 320.81705, "r_y3": 668.03003, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 688.89159, "r_x1": 510.5848700000001, "r_y1": 688.89159, "r_x2": 510.5848700000001, "r_y2": 679.98503, "r_x3": 308.86206, "r_y3": 679.98503, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 701.196594, "r_x1": 545.11505, "r_y1": 701.196594, "r_x2": 545.11505, "r_y2": 692.290024, "r_x3": 320.81705, "r_y3": 692.290024, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 713.151596, "r_x1": 545.11517, "r_y1": 713.151596, "r_x2": 545.11517, "r_y2": 704.245026, "r_x3": 308.86206, "r_y3": 704.245026, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63107, "r_y0": 743.039593, "r_x1": 302.59366, "r_y1": 743.039593, "r_x2": 302.59366, "r_y2": 734.13303, "r_x3": 292.63107, "r_y3": 734.13303, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 30, "label": "picture", "bbox": { "l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT" }, "confidence": 0.6033818125724792, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39108, "r_y0": 83.25922000000003, "r_x1": 151.94641, "r_y1": 83.25922000000003, "r_x2": 151.94641, "r_y2": 77.31055000000003, "r_x3": 119.39108, "r_y3": 77.31055000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.345978, "r_y0": 81.14020000000005, "r_x1": 59.327053, "r_y1": 81.14020000000005, "r_x2": 59.327053, "r_y2": 75.19152999999994, "r_x3": 53.345978, "r_y3": 75.19152999999994, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.5791, "r_y0": 83.40698000000009, "r_x1": 319.8266, "r_y1": 83.40698000000009, "r_x2": 319.8266, "r_y2": 77.45830999999998, "r_x3": 289.5791, "r_y3": 77.45830999999998, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37271, "r_y0": 83.20263999999997, "r_x1": 481.75916, "r_y1": 83.20263999999997, "r_x2": 481.75916, "r_y2": 77.25396999999987, "r_x3": 448.37271, "r_y3": 77.25396999999987, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.553436, "r_y0": 146.23339999999996, "r_x1": 94.976013, "r_y1": 146.23339999999996, "r_x2": 94.976013, "r_y2": 141.27617999999995, "r_x3": 82.553436, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.03878399999999, "r_y0": 106.06133999999986, "r_x1": 85.290085, "r_y1": 106.06133999999986, "r_x2": 85.290085, "r_y2": 101.10413000000005, "r_x3": 63.03878399999999, "r_y3": 101.10413000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.76786, "r_y0": 129.35253999999998, "r_x1": 85.231277, "r_y1": 129.35253999999998, "r_x2": 85.231277, "r_y2": 124.39531999999997, "r_x3": 67.76786, "r_y3": 124.39531999999997, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55121, "r_y0": 107.49712999999997, "r_x1": 249.80251, "r_y1": 107.49712999999997, "r_x2": 249.80251, "r_y2": 102.53992000000005, "r_x3": 227.55121, "r_y3": 102.53992000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.19898999999998, "r_y0": 131.94299, "r_x1": 249.66241, "r_y1": 131.94299, "r_x2": 249.66241, "r_y2": 126.98577999999986, "r_x3": 232.19898999999998, "r_y3": 126.98577999999986, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2337, "r_y0": 119.00243999999998, "r_x1": 413.69711, "r_y1": 119.00243999999998, "r_x2": 413.69711, "r_y2": 114.04522999999995, "r_x3": 396.2337, "r_y3": 114.04522999999995, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.382202, "r_y0": 146.23339999999996, "r_x1": 105.08014, "r_y1": 146.23339999999996, "r_x2": 105.08014, "r_y2": 141.27617999999995, "r_x3": 97.382202, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.93763400000001, "r_y0": 90.69042999999999, "r_x1": 76.151443, "r_y1": 90.69042999999999, "r_x2": 76.151443, "r_y2": 85.73321999999996, "r_x3": 60.93763400000001, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.304901, "r_y0": 91.18073000000015, "r_x1": 106.99162, "r_y1": 91.18073000000015, "r_x2": 106.99162, "r_y2": 86.22351000000003, "r_x3": 82.304901, "r_y3": 86.22351000000003, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.20530999999997, "r_y0": 146.56329000000005, "r_x1": 281.88013, "r_y1": 146.56329000000005, "r_x2": 281.88013, "r_y2": 141.60608000000002, "r_x3": 246.20530999999997, "r_y3": 141.60608000000002, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.69780000000003, "r_y0": 90.69042999999999, "r_x1": 241.91161, "r_y1": 90.69042999999999, "r_x2": 241.91161, "r_y2": 85.73321999999996, "r_x3": 226.69780000000003, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.93848999999997, "r_y0": 91.04522999999995, "r_x1": 282.49384, "r_y1": 91.04522999999995, "r_x2": 282.49384, "r_y2": 86.08801000000005, "r_x3": 249.93848999999997, "r_y3": 86.08801000000005, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19409, "r_y0": 146.23339999999996, "r_x1": 444.68915, "r_y1": 146.23339999999996, "r_x2": 444.68915, "r_y2": 141.27617999999995, "r_x3": 410.19409, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37341, "r_y0": 90.69042999999999, "r_x1": 432.6716599999999, "r_y1": 90.69042999999999, "r_x2": 432.6716599999999, "r_y2": 85.73321999999996, "r_x3": 391.37341, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.60571000000004, "r_y0": 91.21862999999996, "r_x1": 445.62414999999993, "r_y1": 91.21862999999996, "r_x2": 445.62414999999993, "r_y2": 86.26140999999996, "r_x3": 435.60571000000004, "r_y3": 86.26140999999996, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.94921, "r_y0": 146.24567000000002, "r_x1": 136.20052, "r_y1": 146.24567000000002, "r_x2": 136.20052, "r_y2": 141.28845, "r_x3": 113.94921, "r_y3": 141.28845, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.91554000000001, "r_y0": 99.77575999999999, "r_x1": 127.05433999999998, "r_y1": 99.77575999999999, "r_x2": 127.05433999999998, "r_y2": 94.81853999999998, "r_x3": 116.91554000000001, "r_y3": 94.81853999999998, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.3146, "r_y0": 105.89575000000002, "r_x1": 127.05298, "r_y1": 105.89575000000002, "r_x2": 127.05298, "r_y2": 100.93853999999999, "r_x3": 113.3146, "r_y3": 100.93853999999999, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94112, "r_y0": 112.01575000000003, "r_x1": 127.05537, "r_y1": 112.01575000000003, "r_x2": 127.05537, "r_y2": 107.05853000000013, "r_x3": 112.94112, "r_y3": 107.05853000000013, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.22738999999999, "r_y0": 127.57245, "r_x1": 126.96577, "r_y1": 127.57245, "r_x2": 126.96577, "r_y2": 122.61523, "r_x3": 113.22738999999999, "r_y3": 122.61523, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85390000000001, "r_y0": 133.69244000000003, "r_x1": 126.96814999999998, "r_y1": 133.69244000000003, "r_x2": 126.96814999999998, "r_y2": 128.73523, "r_x3": 112.85390000000001, "r_y3": 128.73523, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.57864, "r_y0": 146.39362000000006, "r_x1": 156.04207, "r_y1": 146.39362000000006, "r_x2": 156.04207, "r_y2": 141.43640000000005, "r_x3": 138.57864, "r_y3": 141.43640000000005, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03101, "r_y0": 91.22852, "r_x1": 151.04185, "r_y1": 91.22852, "r_x2": 151.04185, "r_y2": 86.2713, "r_x3": 122.03101, "r_y3": 86.2713, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65359, "r_y0": 91.5122100000001, "r_x1": 321.67203, "r_y1": 91.5122100000001, "r_x2": 321.67203, "r_y2": 86.55498999999998, "r_x3": 311.65359, "r_y3": 86.55498999999998, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89441, "r_y0": 146.66785000000004, "r_x1": 310.14572, "r_y1": 146.66785000000004, "r_x2": 310.14572, "r_y2": 141.71063000000004, "r_x3": 287.89441, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.23572, "r_y0": 98.03698999999995, "r_x1": 299.37451, "r_y1": 98.03698999999995, "r_x2": 299.37451, "r_y2": 93.07977000000005, "r_x3": 289.23572, "r_y3": 93.07977000000005, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63513, "r_y0": 104.15698000000009, "r_x1": 299.3735, "r_y1": 104.15698000000009, "r_x2": 299.3735, "r_y2": 99.19976999999994, "r_x3": 285.63513, "r_y3": 99.19976999999994, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26111, "r_y0": 110.27697999999998, "r_x1": 299.37537, "r_y1": 110.27697999999998, "r_x2": 299.37537, "r_y2": 105.31975999999997, "r_x3": 285.26111, "r_y3": 105.31975999999997, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43109, "r_y0": 125.34717, "r_x1": 299.16946, "r_y1": 125.34717, "r_x2": 299.16946, "r_y2": 120.38995, "r_x3": 285.43109, "r_y3": 120.38995, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.05713, "r_y0": 131.46716000000004, "r_x1": 299.17139, "r_y1": 131.46716000000004, "r_x2": 299.17139, "r_y2": 126.50995, "r_x3": 285.05713, "r_y3": 126.50995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.34592, "r_y0": 146.66785000000004, "r_x1": 328.80933, "r_y1": 146.66785000000004, "r_x2": 328.80933, "r_y2": 141.71063000000004, "r_x3": 311.34592, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58362, "r_y0": 91.65075999999999, "r_x1": 309.60205, "r_y1": 91.65075999999999, "r_x2": 309.60205, "r_y2": 86.69353999999998, "r_x3": 299.58362, "r_y3": 86.69353999999998, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04077000000007, "r_y0": 146.62891000000002, "r_x1": 483.50418, "r_y1": 146.62891000000002, "r_x2": 483.50418, "r_y2": 141.67169, "r_x3": 466.04077000000007, "r_y3": 141.67169, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02151, "r_y0": 98.71838000000002, "r_x1": 469.16031000000004, "r_y1": 98.71838000000002, "r_x2": 469.16031000000004, "r_y2": 93.76116999999999, "r_x3": 459.02151, "r_y3": 93.76116999999999, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.4209, "r_y0": 104.83838000000003, "r_x1": 469.15927000000005, "r_y1": 104.83838000000003, "r_x2": 469.15927000000005, "r_y2": 99.88116000000002, "r_x3": 455.4209, "r_y3": 99.88116000000002, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.04691, "r_y0": 110.95836999999995, "r_x1": 469.16115999999994, "r_y1": 110.95836999999995, "r_x2": 469.16115999999994, "r_y2": 106.00116000000014, "r_x3": 455.04691, "r_y3": 106.00116000000014, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39401, "r_y0": 90.52959999999996, "r_x1": 480.6545100000001, "r_y1": 90.52959999999996, "r_x2": 480.6545100000001, "r_y2": 85.57239000000004, "r_x3": 467.39401, "r_y3": 85.57239000000004, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37672, "r_y0": 146.54107999999997, "r_x1": 182.62802, "r_y1": 146.54107999999997, "r_x2": 182.62802, "r_y2": 141.58385999999996, "r_x3": 160.37672, "r_y3": 141.58385999999996, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74265, "r_y0": 99.82201999999995, "r_x1": 173.32664, "r_y1": 99.82201999999995, "r_x2": 173.32664, "r_y2": 94.86481000000003, "r_x3": 153.74265, "r_y3": 94.86481000000003, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50967, "r_y0": 105.94202000000007, "r_x1": 173.3246, "r_y1": 105.94202000000007, "r_x2": 173.3246, "r_y2": 100.98479999999995, "r_x3": 154.50967, "r_y3": 100.98479999999995, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27162, "r_y0": 112.06200999999987, "r_x1": 173.32664, "r_y1": 112.06200999999987, "r_x2": 173.32664, "r_y2": 107.10479999999995, "r_x3": 155.27162, "r_y3": 107.10479999999995, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41302, "r_y0": 112.18970000000002, "r_x1": 345.99701, "r_y1": 112.18970000000002, "r_x2": 345.99701, "r_y2": 107.23248000000001, "r_x3": 326.41302, "r_y3": 107.23248000000001, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.17972, "r_y0": 118.30969000000005, "r_x1": 345.99463, "r_y1": 118.30969000000005, "r_x2": 345.99463, "r_y2": 113.35248000000001, "r_x3": 327.17972, "r_y3": 113.35248000000001, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94131, "r_y0": 124.42969000000005, "r_x1": 345.99634, "r_y1": 124.42969000000005, "r_x2": 345.99634, "r_y2": 119.47247000000004, "r_x3": 327.94131, "r_y3": 119.47247000000004, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.9942, "r_y0": 109.11095999999998, "r_x1": 508.76384999999993, "r_y1": 109.11095999999998, "r_x2": 508.76384999999993, "r_y2": 104.15374999999983, "r_x3": 488.9942, "r_y3": 104.15374999999983, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.1893, "r_y0": 115.2309600000001, "r_x1": 508.76349000000005, "r_y1": 115.2309600000001, "r_x2": 508.76349000000005, "r_y2": 110.27373999999998, "r_x3": 490.1893, "r_y3": 110.27373999999998, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72009, "r_y0": 121.35095000000013, "r_x1": 508.76758, "r_y1": 121.35095000000013, "r_x2": 508.76758, "r_y2": 116.39373999999998, "r_x3": 489.72009, "r_y3": 116.39373999999998, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71121, "r_y0": 127.47095000000002, "r_x1": 508.76624, "r_y1": 127.47095000000002, "r_x2": 508.76624, "r_y2": 122.51373000000001, "r_x3": 490.71121, "r_y3": 122.51373000000001, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.37759, "r_y0": 146.66840000000002, "r_x1": 202.84102, "r_y1": 146.66840000000002, "r_x2": 202.84102, "r_y2": 141.71118, "r_x3": 185.37759, "r_y3": 141.71118, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.50357, "r_y0": 91.09331999999995, "r_x1": 197.52699, "r_y1": 91.09331999999995, "r_x2": 197.52699, "r_y2": 86.13611000000003, "r_x3": 168.50357, "r_y3": 86.13611000000003, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.3768, "r_y0": 90.95428000000004, "r_x1": 367.39523, "r_y1": 90.95428000000004, "r_x2": 367.39523, "r_y2": 85.99707000000001, "r_x3": 357.3768, "r_y3": 85.99707000000001, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73151, "r_y0": 146.58043999999995, "r_x1": 374.92862, "r_y1": 146.58043999999995, "r_x2": 374.92862, "r_y2": 141.62323000000004, "r_x3": 333.73151, "r_y3": 141.62323000000004, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69101, "r_y0": 91.01312000000007, "r_x1": 355.70944, "r_y1": 91.01312000000007, "r_x2": 355.70944, "r_y2": 86.05591000000004, "r_x3": 345.69101, "r_y3": 86.05591000000004, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54248, "r_y0": 146.33405000000005, "r_x1": 526.00592, "r_y1": 146.33405000000005, "r_x2": 526.00592, "r_y2": 141.37683000000004, "r_x3": 508.54248, "r_y3": 141.37683000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.44653000000005, "r_y0": 91.0498, "r_x1": 523.70703, "r_y1": 91.0498, "r_x2": 523.70703, "r_y2": 86.09258999999986, "r_x3": 510.44653000000005, "r_y3": 86.09258999999986, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 46, "label": "text", "bbox": { "l": 119.39108, "t": 77.31055000000003, "r": 151.94641, "b": 83.25922000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39108, "r_y0": 83.25922000000003, "r_x1": 151.94641, "r_y1": 83.25922000000003, "r_x2": 151.94641, "r_y2": 77.31055000000003, "r_x3": 119.39108, "r_y3": 77.31055000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 53.345978, "t": 75.19152999999994, "r": 59.327053, "b": 81.14020000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.345978, "r_y0": 81.14020000000005, "r_x1": 59.327053, "r_y1": 81.14020000000005, "r_x2": 59.327053, "r_y2": 75.19152999999994, "r_x3": 53.345978, "r_y3": 75.19152999999994, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 289.5791, "t": 77.45830999999998, "r": 319.8266, "b": 83.40698000000009, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.5791, "r_y0": 83.40698000000009, "r_x1": 319.8266, "r_y1": 83.40698000000009, "r_x2": 319.8266, "r_y2": 77.45830999999998, "r_x3": 289.5791, "r_y3": 77.45830999999998, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 448.37271, "t": 77.25396999999987, "r": 481.75916, "b": 83.20263999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37271, "r_y0": 83.20263999999997, "r_x1": 481.75916, "r_y1": 83.20263999999997, "r_x2": 481.75916, "r_y2": 77.25396999999987, "r_x3": 448.37271, "r_y3": 77.25396999999987, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 82.553436, "t": 141.27617999999995, "r": 94.976013, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.553436, "r_y0": 146.23339999999996, "r_x1": 94.976013, "r_y1": 146.23339999999996, "r_x2": 94.976013, "r_y2": 141.27617999999995, "r_x3": 82.553436, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 63.03878399999999, "t": 101.10413000000005, "r": 85.290085, "b": 106.06133999999986, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.03878399999999, "r_y0": 106.06133999999986, "r_x1": 85.290085, "r_y1": 106.06133999999986, "r_x2": 85.290085, "r_y2": 101.10413000000005, "r_x3": 63.03878399999999, "r_y3": 101.10413000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 67.76786, "t": 124.39531999999997, "r": 85.231277, "b": 129.35253999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.76786, "r_y0": 129.35253999999998, "r_x1": 85.231277, "r_y1": 129.35253999999998, "r_x2": 85.231277, "r_y2": 124.39531999999997, "r_x3": 67.76786, "r_y3": 124.39531999999997, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 227.55121, "t": 102.53992000000005, "r": 249.80251, "b": 107.49712999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55121, "r_y0": 107.49712999999997, "r_x1": 249.80251, "r_y1": 107.49712999999997, "r_x2": 249.80251, "r_y2": 102.53992000000005, "r_x3": 227.55121, "r_y3": 102.53992000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 232.19898999999998, "t": 126.98577999999986, "r": 249.66241, "b": 131.94299, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.19898999999998, "r_y0": 131.94299, "r_x1": 249.66241, "r_y1": 131.94299, "r_x2": 249.66241, "r_y2": 126.98577999999986, "r_x3": 232.19898999999998, "r_y3": 126.98577999999986, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 396.2337, "t": 114.04522999999995, "r": 413.69711, "b": 119.00243999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2337, "r_y0": 119.00243999999998, "r_x1": 413.69711, "r_y1": 119.00243999999998, "r_x2": 413.69711, "r_y2": 114.04522999999995, "r_x3": 396.2337, "r_y3": 114.04522999999995, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 97.382202, "t": 141.27617999999995, "r": 105.08014, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.382202, "r_y0": 146.23339999999996, "r_x1": 105.08014, "r_y1": 146.23339999999996, "r_x2": 105.08014, "r_y2": 141.27617999999995, "r_x3": 97.382202, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 60.93763400000001, "t": 85.73321999999996, "r": 76.151443, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.93763400000001, "r_y0": 90.69042999999999, "r_x1": 76.151443, "r_y1": 90.69042999999999, "r_x2": 76.151443, "r_y2": 85.73321999999996, "r_x3": 60.93763400000001, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 82.304901, "t": 86.22351000000003, "r": 106.99162, "b": 91.18073000000015, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.304901, "r_y0": 91.18073000000015, "r_x1": 106.99162, "r_y1": 91.18073000000015, "r_x2": 106.99162, "r_y2": 86.22351000000003, "r_x3": 82.304901, "r_y3": 86.22351000000003, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 246.20530999999997, "t": 141.60608000000002, "r": 281.88013, "b": 146.56329000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.20530999999997, "r_y0": 146.56329000000005, "r_x1": 281.88013, "r_y1": 146.56329000000005, "r_x2": 281.88013, "r_y2": 141.60608000000002, "r_x3": 246.20530999999997, "r_y3": 141.60608000000002, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 226.69780000000003, "t": 85.73321999999996, "r": 241.91161, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.69780000000003, "r_y0": 90.69042999999999, "r_x1": 241.91161, "r_y1": 90.69042999999999, "r_x2": 241.91161, "r_y2": 85.73321999999996, "r_x3": 226.69780000000003, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 249.93848999999997, "t": 86.08801000000005, "r": 282.49384, "b": 91.04522999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.93848999999997, "r_y0": 91.04522999999995, "r_x1": 282.49384, "r_y1": 91.04522999999995, "r_x2": 282.49384, "r_y2": 86.08801000000005, "r_x3": 249.93848999999997, "r_y3": 86.08801000000005, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 410.19409, "t": 141.27617999999995, "r": 444.68915, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19409, "r_y0": 146.23339999999996, "r_x1": 444.68915, "r_y1": 146.23339999999996, "r_x2": 444.68915, "r_y2": 141.27617999999995, "r_x3": 410.19409, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 391.37341, "t": 85.73321999999996, "r": 432.6716599999999, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37341, "r_y0": 90.69042999999999, "r_x1": 432.6716599999999, "r_y1": 90.69042999999999, "r_x2": 432.6716599999999, "r_y2": 85.73321999999996, "r_x3": 391.37341, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 435.60571000000004, "t": 86.26140999999996, "r": 445.62414999999993, "b": 91.21862999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.60571000000004, "r_y0": 91.21862999999996, "r_x1": 445.62414999999993, "r_y1": 91.21862999999996, "r_x2": 445.62414999999993, "r_y2": 86.26140999999996, "r_x3": 435.60571000000004, "r_y3": 86.26140999999996, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 113.94921, "t": 141.28845, "r": 136.20052, "b": 146.24567000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.94921, "r_y0": 146.24567000000002, "r_x1": 136.20052, "r_y1": 146.24567000000002, "r_x2": 136.20052, "r_y2": 141.28845, "r_x3": 113.94921, "r_y3": 141.28845, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 116.91554000000001, "t": 94.81853999999998, "r": 127.05433999999998, "b": 99.77575999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.91554000000001, "r_y0": 99.77575999999999, "r_x1": 127.05433999999998, "r_y1": 99.77575999999999, "r_x2": 127.05433999999998, "r_y2": 94.81853999999998, "r_x3": 116.91554000000001, "r_y3": 94.81853999999998, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 113.3146, "t": 100.93853999999999, "r": 127.05298, "b": 105.89575000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.3146, "r_y0": 105.89575000000002, "r_x1": 127.05298, "r_y1": 105.89575000000002, "r_x2": 127.05298, "r_y2": 100.93853999999999, "r_x3": 113.3146, "r_y3": 100.93853999999999, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 112.94112, "t": 107.05853000000013, "r": 127.05537, "b": 112.01575000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94112, "r_y0": 112.01575000000003, "r_x1": 127.05537, "r_y1": 112.01575000000003, "r_x2": 127.05537, "r_y2": 107.05853000000013, "r_x3": 112.94112, "r_y3": 107.05853000000013, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 113.22738999999999, "t": 122.61523, "r": 126.96577, "b": 127.57245, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.22738999999999, "r_y0": 127.57245, "r_x1": 126.96577, "r_y1": 127.57245, "r_x2": 126.96577, "r_y2": 122.61523, "r_x3": 113.22738999999999, "r_y3": 122.61523, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 112.85390000000001, "t": 128.73523, "r": 126.96814999999998, "b": 133.69244000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85390000000001, "r_y0": 133.69244000000003, "r_x1": 126.96814999999998, "r_y1": 133.69244000000003, "r_x2": 126.96814999999998, "r_y2": 128.73523, "r_x3": 112.85390000000001, "r_y3": 128.73523, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 138.57864, "t": 141.43640000000005, "r": 156.04207, "b": 146.39362000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.57864, "r_y0": 146.39362000000006, "r_x1": 156.04207, "r_y1": 146.39362000000006, "r_x2": 156.04207, "r_y2": 141.43640000000005, "r_x3": 138.57864, "r_y3": 141.43640000000005, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 122.03101, "t": 86.2713, "r": 151.04185, "b": 91.22852, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03101, "r_y0": 91.22852, "r_x1": 151.04185, "r_y1": 91.22852, "r_x2": 151.04185, "r_y2": 86.2713, "r_x3": 122.03101, "r_y3": 86.2713, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 311.65359, "t": 86.55498999999998, "r": 321.67203, "b": 91.5122100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65359, "r_y0": 91.5122100000001, "r_x1": 321.67203, "r_y1": 91.5122100000001, "r_x2": 321.67203, "r_y2": 86.55498999999998, "r_x3": 311.65359, "r_y3": 86.55498999999998, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 287.89441, "t": 141.71063000000004, "r": 310.14572, "b": 146.66785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89441, "r_y0": 146.66785000000004, "r_x1": 310.14572, "r_y1": 146.66785000000004, "r_x2": 310.14572, "r_y2": 141.71063000000004, "r_x3": 287.89441, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.23572, "t": 93.07977000000005, "r": 299.37451, "b": 98.03698999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.23572, "r_y0": 98.03698999999995, "r_x1": 299.37451, "r_y1": 98.03698999999995, "r_x2": 299.37451, "r_y2": 93.07977000000005, "r_x3": 289.23572, "r_y3": 93.07977000000005, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 285.63513, "t": 99.19976999999994, "r": 299.3735, "b": 104.15698000000009, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63513, "r_y0": 104.15698000000009, "r_x1": 299.3735, "r_y1": 104.15698000000009, "r_x2": 299.3735, "r_y2": 99.19976999999994, "r_x3": 285.63513, "r_y3": 99.19976999999994, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 285.26111, "t": 105.31975999999997, "r": 299.37537, "b": 110.27697999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26111, "r_y0": 110.27697999999998, "r_x1": 299.37537, "r_y1": 110.27697999999998, "r_x2": 299.37537, "r_y2": 105.31975999999997, "r_x3": 285.26111, "r_y3": 105.31975999999997, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 285.43109, "t": 120.38995, "r": 299.16946, "b": 125.34717, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43109, "r_y0": 125.34717, "r_x1": 299.16946, "r_y1": 125.34717, "r_x2": 299.16946, "r_y2": 120.38995, "r_x3": 285.43109, "r_y3": 120.38995, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 285.05713, "t": 126.50995, "r": 299.17139, "b": 131.46716000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.05713, "r_y0": 131.46716000000004, "r_x1": 299.17139, "r_y1": 131.46716000000004, "r_x2": 299.17139, "r_y2": 126.50995, "r_x3": 285.05713, "r_y3": 126.50995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 311.34592, "t": 141.71063000000004, "r": 328.80933, "b": 146.66785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.34592, "r_y0": 146.66785000000004, "r_x1": 328.80933, "r_y1": 146.66785000000004, "r_x2": 328.80933, "r_y2": 141.71063000000004, "r_x3": 311.34592, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 299.58362, "t": 86.69353999999998, "r": 309.60205, "b": 91.65075999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58362, "r_y0": 91.65075999999999, "r_x1": 309.60205, "r_y1": 91.65075999999999, "r_x2": 309.60205, "r_y2": 86.69353999999998, "r_x3": 299.58362, "r_y3": 86.69353999999998, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 466.04077000000007, "t": 141.67169, "r": 483.50418, "b": 146.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04077000000007, "r_y0": 146.62891000000002, "r_x1": 483.50418, "r_y1": 146.62891000000002, "r_x2": 483.50418, "r_y2": 141.67169, "r_x3": 466.04077000000007, "r_y3": 141.67169, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 459.02151, "t": 93.76116999999999, "r": 469.16031000000004, "b": 98.71838000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02151, "r_y0": 98.71838000000002, "r_x1": 469.16031000000004, "r_y1": 98.71838000000002, "r_x2": 469.16031000000004, "r_y2": 93.76116999999999, "r_x3": 459.02151, "r_y3": 93.76116999999999, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 455.4209, "t": 99.88116000000002, "r": 469.15927000000005, "b": 104.83838000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.4209, "r_y0": 104.83838000000003, "r_x1": 469.15927000000005, "r_y1": 104.83838000000003, "r_x2": 469.15927000000005, "r_y2": 99.88116000000002, "r_x3": 455.4209, "r_y3": 99.88116000000002, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 455.04691, "t": 106.00116000000014, "r": 469.16115999999994, "b": 110.95836999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.04691, "r_y0": 110.95836999999995, "r_x1": 469.16115999999994, "r_y1": 110.95836999999995, "r_x2": 469.16115999999994, "r_y2": 106.00116000000014, "r_x3": 455.04691, "r_y3": 106.00116000000014, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 467.39401, "t": 85.57239000000004, "r": 480.6545100000001, "b": 90.52959999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39401, "r_y0": 90.52959999999996, "r_x1": 480.6545100000001, "r_y1": 90.52959999999996, "r_x2": 480.6545100000001, "r_y2": 85.57239000000004, "r_x3": 467.39401, "r_y3": 85.57239000000004, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 160.37672, "t": 141.58385999999996, "r": 182.62802, "b": 146.54107999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37672, "r_y0": 146.54107999999997, "r_x1": 182.62802, "r_y1": 146.54107999999997, "r_x2": 182.62802, "r_y2": 141.58385999999996, "r_x3": 160.37672, "r_y3": 141.58385999999996, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 153.74265, "t": 94.86481000000003, "r": 173.32664, "b": 99.82201999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74265, "r_y0": 99.82201999999995, "r_x1": 173.32664, "r_y1": 99.82201999999995, "r_x2": 173.32664, "r_y2": 94.86481000000003, "r_x3": 153.74265, "r_y3": 94.86481000000003, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 154.50967, "t": 100.98479999999995, "r": 173.3246, "b": 105.94202000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50967, "r_y0": 105.94202000000007, "r_x1": 173.3246, "r_y1": 105.94202000000007, "r_x2": 173.3246, "r_y2": 100.98479999999995, "r_x3": 154.50967, "r_y3": 100.98479999999995, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 155.27162, "t": 107.10479999999995, "r": 173.32664, "b": 112.06200999999987, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27162, "r_y0": 112.06200999999987, "r_x1": 173.32664, "r_y1": 112.06200999999987, "r_x2": 173.32664, "r_y2": 107.10479999999995, "r_x3": 155.27162, "r_y3": 107.10479999999995, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.41302, "t": 107.23248000000001, "r": 345.99701, "b": 112.18970000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41302, "r_y0": 112.18970000000002, "r_x1": 345.99701, "r_y1": 112.18970000000002, "r_x2": 345.99701, "r_y2": 107.23248000000001, "r_x3": 326.41302, "r_y3": 107.23248000000001, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 327.17972, "t": 113.35248000000001, "r": 345.99463, "b": 118.30969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.17972, "r_y0": 118.30969000000005, "r_x1": 345.99463, "r_y1": 118.30969000000005, "r_x2": 345.99463, "r_y2": 113.35248000000001, "r_x3": 327.17972, "r_y3": 113.35248000000001, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 327.94131, "t": 119.47247000000004, "r": 345.99634, "b": 124.42969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94131, "r_y0": 124.42969000000005, "r_x1": 345.99634, "r_y1": 124.42969000000005, "r_x2": 345.99634, "r_y2": 119.47247000000004, "r_x3": 327.94131, "r_y3": 119.47247000000004, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 488.9942, "t": 104.15374999999983, "r": 508.76384999999993, "b": 109.11095999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.9942, "r_y0": 109.11095999999998, "r_x1": 508.76384999999993, "r_y1": 109.11095999999998, "r_x2": 508.76384999999993, "r_y2": 104.15374999999983, "r_x3": 488.9942, "r_y3": 104.15374999999983, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 490.1893, "t": 110.27373999999998, "r": 508.76349000000005, "b": 115.2309600000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.1893, "r_y0": 115.2309600000001, "r_x1": 508.76349000000005, "r_y1": 115.2309600000001, "r_x2": 508.76349000000005, "r_y2": 110.27373999999998, "r_x3": 490.1893, "r_y3": 110.27373999999998, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 489.72009, "t": 116.39373999999998, "r": 508.76758, "b": 121.35095000000013, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72009, "r_y0": 121.35095000000013, "r_x1": 508.76758, "r_y1": 121.35095000000013, "r_x2": 508.76758, "r_y2": 116.39373999999998, "r_x3": 489.72009, "r_y3": 116.39373999999998, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 490.71121, "t": 122.51373000000001, "r": 508.76624, "b": 127.47095000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71121, "r_y0": 127.47095000000002, "r_x1": 508.76624, "r_y1": 127.47095000000002, "r_x2": 508.76624, "r_y2": 122.51373000000001, "r_x3": 490.71121, "r_y3": 122.51373000000001, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 185.37759, "t": 141.71118, "r": 202.84102, "b": 146.66840000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.37759, "r_y0": 146.66840000000002, "r_x1": 202.84102, "r_y1": 146.66840000000002, "r_x2": 202.84102, "r_y2": 141.71118, "r_x3": 185.37759, "r_y3": 141.71118, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 168.50357, "t": 86.13611000000003, "r": 197.52699, "b": 91.09331999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.50357, "r_y0": 91.09331999999995, "r_x1": 197.52699, "r_y1": 91.09331999999995, "r_x2": 197.52699, "r_y2": 86.13611000000003, "r_x3": 168.50357, "r_y3": 86.13611000000003, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 357.3768, "t": 85.99707000000001, "r": 367.39523, "b": 90.95428000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.3768, "r_y0": 90.95428000000004, "r_x1": 367.39523, "r_y1": 90.95428000000004, "r_x2": 367.39523, "r_y2": 85.99707000000001, "r_x3": 357.3768, "r_y3": 85.99707000000001, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 333.73151, "t": 141.62323000000004, "r": 374.92862, "b": 146.58043999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73151, "r_y0": 146.58043999999995, "r_x1": 374.92862, "r_y1": 146.58043999999995, "r_x2": 374.92862, "r_y2": 141.62323000000004, "r_x3": 333.73151, "r_y3": 141.62323000000004, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 345.69101, "t": 86.05591000000004, "r": 355.70944, "b": 91.01312000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69101, "r_y0": 91.01312000000007, "r_x1": 355.70944, "r_y1": 91.01312000000007, "r_x2": 355.70944, "r_y2": 86.05591000000004, "r_x3": 345.69101, "r_y3": 86.05591000000004, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 508.54248, "t": 141.37683000000004, "r": 526.00592, "b": 146.33405000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54248, "r_y0": 146.33405000000005, "r_x1": 526.00592, "r_y1": 146.33405000000005, "r_x2": 526.00592, "r_y2": 141.37683000000004, "r_x3": 508.54248, "r_y3": 141.37683000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 510.44653000000005, "t": 86.09258999999986, "r": 523.70703, "b": 91.0498, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.44653000000005, "r_y0": 91.0498, "r_x1": 523.70703, "r_y1": 91.0498, "r_x2": 523.70703, "r_y2": 86.09258999999986, "r_x3": 510.44653000000005, "r_y3": 86.09258999999986, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 1, "label": "caption", "bbox": { "l": 50.112, "t": 165.50238000000002, "r": 545.11371, "b": 186.36395000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9661495685577393, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 174.40894000000003, "r_x1": 545.11371, "r_y1": 174.40894000000003, "r_x2": 545.11371, "r_y2": 165.50238000000002, "r_x3": 50.112, "r_y3": 165.50238000000002, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 186.36395000000005, "r_x1": 513.52234, "r_y1": 186.36395000000005, "r_x2": 513.52234, "r_y2": 177.4574, "r_x3": 50.112, "r_y3": 177.4574, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 61.569, "t": 210.93140000000005, "r": 286.36511, "b": 231.79296999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9621952772140503, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 219.83794999999998, "r_x1": 71.14743, "r_y1": 219.83794999999998, "r_x2": 71.14743, "r_y2": 210.93140000000005, "r_x3": 61.569, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.542038, "r_y0": 219.83794999999998, "r_x1": 286.36511, "r_y1": 219.83794999999998, "r_x2": 286.36511, "r_y2": 210.93140000000005, "r_x3": 73.542038, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 231.79296999999997, "r_x1": 87.47155, "r_y1": 231.79296999999997, "r_x2": 87.47155, "r_y2": 222.88640999999996, "r_x3": 70.037003, "r_y3": 222.88640999999996, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 61.569, "t": 244.07141000000001, "r": 286.36514, "b": 264.93298000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9629555344581604, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 252.97797000000003, "r_x1": 71.345718, "r_y1": 252.97797000000003, "r_x2": 71.345718, "r_y2": 244.07141000000001, "r_x3": 61.569, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.789902, "r_y0": 252.97797000000003, "r_x1": 286.36514, "r_y1": 252.97797000000003, "r_x2": 286.36514, "r_y2": 244.07141000000001, "r_x3": 73.789902, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 264.93298000000004, "r_x1": 150.41524, "r_y1": 264.93298000000004, "r_x2": 150.41524, "r_y2": 256.02643, "r_x3": 70.037003, "r_y3": 256.02643, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 50.112, "t": 279.20343, "r": 286.36511, "b": 395.70688, "coord_origin": "TOPLEFT" }, "confidence": 0.9767085909843445, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 288.10999, "r_x1": 286.36499, "r_y1": 288.10999, "r_x2": 286.36499, "r_y2": 279.20343, "r_x3": 62.067001, "r_y3": 279.20343, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.06497, "r_x1": 286.36505, "r_y1": 300.06497, "r_x2": 286.36505, "r_y2": 291.15842, "r_x3": 50.112, "r_y3": 291.15842, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.01996, "r_x1": 286.36511, "r_y1": 312.01996, "r_x2": 286.36511, "r_y2": 303.1134, "r_x3": 50.112, "r_y3": 303.1134, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 323.97495, "r_x1": 286.36511, "r_y1": 323.97495, "r_x2": 286.36511, "r_y2": 315.06839, "r_x3": 50.112, "r_y3": 315.06839, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 335.93093999999996, "r_x1": 286.36511, "r_y1": 335.93093999999996, "r_x2": 286.36511, "r_y2": 327.02438, "r_x3": 50.112, "r_y3": 327.02438, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 347.88593, "r_x1": 286.36505, "r_y1": 347.88593, "r_x2": 286.36505, "r_y2": 338.97937, "r_x3": 50.112, "r_y3": 338.97937, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.84091, "r_x1": 286.36508, "r_y1": 359.84091, "r_x2": 286.36508, "r_y2": 350.93436, "r_x3": 50.112, "r_y3": 350.93436, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.7959, "r_x1": 286.36511, "r_y1": 371.7959, "r_x2": 286.36511, "r_y2": 362.88934, "r_x3": 50.112, "r_y3": 362.88934, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 383.75089, "r_x1": 286.36508, "r_y1": 383.75089, "r_x2": 286.36508, "r_y2": 374.84433000000007, "r_x3": 50.112, "r_y3": 374.84433000000007, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 395.70688, "r_x1": 154.55988, "r_y1": 395.70688, "r_x2": 154.55988, "r_y2": 386.80032, "r_x3": 50.112, "r_y3": 386.80032, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 50.112, "t": 399.06934, "r": 286.36496, "b": 419.93188, "coord_origin": "TOPLEFT" }, "confidence": 0.934766411781311, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 407.97589, "r_x1": 286.36496, "r_y1": 407.97589, "r_x2": 286.36496, "r_y2": 399.06934, "r_x3": 62.067001, "r_y3": 399.06934, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 419.93188, "r_x1": 95.491638, "r_y1": 419.93188, "r_x2": 95.491638, "r_y2": 411.02533, "r_x3": 50.112, "r_y3": 411.02533, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "list_item", "bbox": { "l": 50.112, "t": 423.29532, "r": 286.36508, "b": 456.11185000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.8280702233314514, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 432.20187, "r_x1": 69.37281, "r_y1": 432.20187, "r_x2": 69.37281, "r_y2": 423.29532, "r_x3": 62.067001, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.808075, "r_y0": 432.20187, "r_x1": 286.36502, "r_y1": 432.20187, "r_x2": 286.36502, "r_y2": 423.29532, "r_x3": 71.808075, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 444.15686, "r_x1": 286.36508, "r_y1": 444.15686, "r_x2": 286.36508, "r_y2": 435.25031, "r_x3": 50.112, "r_y3": 435.25031, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 456.11185000000006, "r_x1": 274.50958, "r_y1": 456.11185000000006, "r_x2": 274.50958, "r_y2": 447.20529, "r_x3": 50.112, "r_y3": 447.20529, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 50.112, "t": 459.47528, "r": 286.36505, "b": 504.2468, "coord_origin": "TOPLEFT" }, "confidence": 0.9646760821342468, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 468.38184, "r_x1": 69.538948, "r_y1": 468.38184, "r_x2": 69.538948, "r_y2": 459.47528, "r_x3": 62.067001, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.429329, "r_y0": 468.38184, "r_x1": 286.36499, "r_y1": 468.38184, "r_x2": 286.36499, "r_y2": 459.47528, "r_x3": 77.429329, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 480.33682, "r_x1": 286.36505, "r_y1": 480.33682, "r_x2": 286.36505, "r_y2": 471.43027, "r_x3": 50.112, "r_y3": 471.43027, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.29181, "r_x1": 286.36505, "r_y1": 492.29181, "r_x2": 286.36505, "r_y2": 483.38525, "r_x3": 50.112, "r_y3": 483.38525, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 504.2468, "r_x1": 110.70452999999999, "r_y1": 504.2468, "r_x2": 110.70452999999999, "r_y2": 495.34024, "r_x3": 50.112, "r_y3": 495.34024, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 50.112, "t": 507.61023, "r": 286.36493, "b": 528.4727800000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9391399025917053, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 516.5167799999999, "r_x1": 69.863068, "r_y1": 516.5167799999999, "r_x2": 69.863068, "r_y2": 507.61023, "r_x3": 62.067001, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.461754, "r_y0": 516.5167799999999, "r_x1": 286.36493, "r_y1": 516.5167799999999, "r_x2": 286.36493, "r_y2": 507.61023, "r_x3": 72.461754, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 528.4727800000001, "r_x1": 226.0714, "r_y1": 528.4727800000001, "r_x2": 226.0714, "r_y2": 519.5662199999999, "r_x3": 50.112, "r_y3": 519.5662199999999, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 50.112, "t": 531.83521, "r": 286.36511, "b": 564.65277, "coord_origin": "TOPLEFT" }, "confidence": 0.9491708874702454, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 540.7417800000001, "r_x1": 286.36496, "r_y1": 540.7417800000001, "r_x2": 286.36496, "r_y2": 531.83521, "r_x3": 62.067001, "r_y3": 531.83521, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 552.69777, "r_x1": 286.36511, "r_y1": 552.69777, "r_x2": 286.36511, "r_y2": 543.79121, "r_x3": 50.112, "r_y3": 543.79121, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 564.65277, "r_x1": 114.03204, "r_y1": 564.65277, "r_x2": 114.03204, "r_y2": 555.74622, "r_x3": 50.112, "r_y3": 555.74622, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 50.112, "t": 568.01622, "r": 286.36508, "b": 600.83278, "coord_origin": "TOPLEFT" }, "confidence": 0.9587163329124451, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 576.92278, "r_x1": 69.538948, "r_y1": 576.92278, "r_x2": 69.538948, "r_y2": 568.01622, "r_x3": 62.067001, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.731949, "r_y0": 576.92278, "r_x1": 286.36502, "r_y1": 576.92278, "r_x2": 286.36502, "r_y2": 568.01622, "r_x3": 76.731949, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 588.87778, "r_x1": 286.36508, "r_y1": 588.87778, "r_x2": 286.36508, "r_y2": 579.97122, "r_x3": 50.112, "r_y3": 579.97122, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 600.83278, "r_x1": 278.70383, "r_y1": 600.83278, "r_x2": 278.70383, "r_y2": 591.9262200000001, "r_x3": 50.112, "r_y3": 591.9262200000001, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "formula", "bbox": { "l": 110.70499, "t": 623.43591, "r": 286.3624, "b": 654.1056100000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9298412799835205, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.02799999999999, "r_y0": 632.84061, "r_x1": 157.9516, "r_y1": 632.84061, "r_x2": 157.9516, "r_y2": 623.99382, "r_x3": 112.02799999999999, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.715, "r_y0": 632.84061, "r_x1": 203.4964, "r_y1": 632.84061, "r_x2": 203.4964, "r_y2": 623.99382, "r_x3": 160.715, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58499, "r_y0": 640.17578, "r_x1": 189.14511, "r_y1": 640.17578, "r_x2": 189.14511, "r_y2": 633.98305, "r_x3": 185.58499, "r_y3": 633.98305, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.49899, "r_y0": 632.84061, "r_x1": 208.48029, "r_y1": 632.84061, "r_x2": 208.48029, "r_y2": 623.43591, "r_x3": 203.49899, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48099, "r_y0": 632.84061, "r_x1": 220.28911, "r_y1": 632.84061, "r_x2": 220.28911, "r_y2": 623.99382, "r_x3": 208.48099, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.78699, "r_y0": 632.84061, "r_x1": 225.76828, "r_y1": 632.84061, "r_x2": 225.76828, "r_y2": 623.43591, "r_x3": 220.78699, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.70499, "r_y0": 654.1056100000001, "r_x1": 122.51310999999998, "r_y1": 654.1056100000001, "r_x2": 122.51310999999998, "r_y2": 645.25882, "r_x3": 110.70499, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.77899000000001, "r_y0": 654.1056100000001, "r_x1": 133.52791, "r_y1": 654.1056100000001, "r_x2": 133.52791, "r_y2": 645.25882, "r_x3": 125.77899000000001, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.295, "r_y0": 654.1056100000001, "r_x1": 156.00201, "r_y1": 654.1056100000001, "r_x2": 156.00201, "r_y2": 645.25882, "r_x3": 136.295, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.00299, "r_y0": 654.1056100000001, "r_x1": 160.98428, "r_y1": 654.1056100000001, "r_x2": 160.98428, "r_y2": 644.70091, "r_x3": 156.00299, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98399, "r_y0": 654.1056100000001, "r_x1": 170.23811, "r_y1": 654.1056100000001, "r_x2": 170.23811, "r_y2": 645.25882, "r_x3": 160.98399, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.73599, "r_y0": 654.1056100000001, "r_x1": 185.6779, "r_y1": 654.1056100000001, "r_x2": 185.6779, "r_y2": 644.70091, "r_x3": 170.73599, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.894, "r_y0": 654.1056100000001, "r_x1": 206.05283, "r_y1": 654.1056100000001, "r_x2": 206.05283, "r_y2": 645.25882, "r_x3": 187.894, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.054, "r_y0": 654.1056100000001, "r_x1": 211.03529, "r_y1": 654.1056100000001, "r_x2": 211.03529, "r_y2": 644.70091, "r_x3": 206.054, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.035, "r_y0": 654.1056100000001, "r_x1": 220.28912, "r_y1": 654.1056100000001, "r_x2": 220.28912, "r_y2": 645.25882, "r_x3": 211.035, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.787, "r_y0": 654.1056100000001, "r_x1": 225.76829999999998, "r_y1": 654.1056100000001, "r_x2": 225.76829999999998, "r_y2": 644.70091, "r_x3": 220.787, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 643.79178, "r_x1": 286.3624, "r_y1": 643.79178, "r_x2": 286.3624, "r_y2": 634.88522, "r_x3": 274.746, "r_y3": 634.88522, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 50.112, "t": 667.3479199999999, "r": 286.362, "b": 688.92679, "coord_origin": "TOPLEFT" }, "confidence": 0.9545555114746094, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 676.97179, "r_x1": 74.45063, "r_y1": 676.97179, "r_x2": 74.45063, "r_y2": 668.06522, "r_x3": 50.112, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.335999, "r_y0": 676.75261, "r_x1": 82.647812, "r_y1": 676.75261, "r_x2": 82.647812, "r_y2": 667.90582, "r_x3": 78.335999, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.532997, "r_y0": 676.97179, "r_x1": 123.63372, "r_y1": 676.97179, "r_x2": 123.63372, "r_y2": 668.06522, "r_x3": 86.532997, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.51899999999999, "r_y0": 676.75261, "r_x1": 132.50029, "r_y1": 676.75261, "r_x2": 132.50029, "r_y2": 667.3479199999999, "r_x3": 127.51899999999999, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.50099, "r_y0": 676.97179, "r_x1": 210.69743, "r_y1": 676.97179, "r_x2": 210.69743, "r_y2": 668.06522, "r_x3": 132.50099, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.69699, "r_y0": 676.75261, "r_x1": 215.67828, "r_y1": 676.75261, "r_x2": 215.67828, "r_y2": 667.3479199999999, "r_x3": 210.69699, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56299, "r_y0": 676.97179, "r_x1": 233.94897000000003, "r_y1": 676.97179, "r_x2": 233.94897000000003, "r_y2": 668.06522, "r_x3": 219.56299, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83499000000003, "r_y0": 676.75261, "r_x1": 247.08911, "r_y1": 676.75261, "r_x2": 247.08911, "r_y2": 667.90582, "r_x3": 237.83499000000003, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47299000000004, "r_y0": 676.97179, "r_x1": 286.362, "r_y1": 676.97179, "r_x2": 286.362, "r_y2": 668.06522, "r_x3": 251.47299000000004, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 688.92679, "r_x1": 205.88721, "r_y1": 688.92679, "r_x2": 205.88721, "r_y2": 680.02022, "r_x3": 50.112, "r_y3": 680.02022, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 50.112, "t": 692.290222, "r": 286.36496, "b": 713.151787, "coord_origin": "TOPLEFT" }, "confidence": 0.9260510206222534, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 701.196785, "r_x1": 69.538948, "r_y1": 701.196785, "r_x2": 69.538948, "r_y2": 692.290222, "r_x3": 62.067001, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.273666, "r_y0": 701.196785, "r_x1": 286.36496, "r_y1": 701.196785, "r_x2": 286.36496, "r_y2": 692.290222, "r_x3": 76.273666, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.151787, "r_x1": 94.604973, "r_y1": 713.151787, "r_x2": 94.604973, "r_y2": 704.245224, "r_x3": 50.112, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.598999, "r_y0": 712.93261, "r_x1": 103.29263, "r_y1": 712.93261, "r_x2": 103.29263, "r_y2": 704.085815, "r_x3": 97.598999, "r_y3": 704.085815, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.292, "r_y0": 713.151787, "r_x1": 286.36481, "r_y1": 713.151787, "r_x2": 286.36481, "r_y2": 704.245224, "r_x3": 103.292, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 308.862, "t": 210.93120999999996, "r": 545.11517, "b": 255.7038, "coord_origin": "TOPLEFT" }, "confidence": 0.8942298889160156, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 219.83776999999998, "r_x1": 545.11517, "r_y1": 219.83776999999998, "r_x2": 545.11517, "r_y2": 210.93120999999996, "r_x3": 308.862, "r_y3": 210.93120999999996, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 231.79376000000002, "r_x1": 545.11511, "r_y1": 231.79376000000002, "r_x2": 545.11511, "r_y2": 222.88720999999998, "r_x3": 308.862, "r_y3": 222.88720999999998, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 243.74878, "r_x1": 545.11511, "r_y1": 243.74878, "r_x2": 545.11511, "r_y2": 234.84222, "r_x3": 308.862, "r_y3": 234.84222, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 255.7038, "r_x1": 339.57669, "r_y1": 255.7038, "r_x2": 339.57669, "r_y2": 246.79724, "r_x3": 308.862, "r_y3": 246.79724, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 259.10222999999996, "r": 545.11499, "b": 279.96380999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9423392415046692, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 268.00879, "r_x1": 328.28894, "r_y1": 268.00879, "r_x2": 328.28894, "r_y2": 259.10222999999996, "r_x3": 320.81699, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88419, "r_y0": 268.00879, "r_x1": 545.11499, "r_y1": 268.00879, "r_x2": 545.11499, "r_y2": 259.10222999999996, "r_x3": 334.88419, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 279.96380999999997, "r_x1": 338.19189, "r_y1": 279.96380999999997, "r_x2": 338.19189, "r_y2": 271.05724999999995, "r_x3": 308.862, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68201, "r_y0": 279.74463000000003, "r_x1": 346.37564, "r_y1": 279.74463000000003, "r_x2": 346.37564, "r_y2": 270.89783, "r_x3": 340.68201, "r_y3": 270.89783, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37601, "r_y0": 279.96380999999997, "r_x1": 453.72305000000006, "r_y1": 279.96380999999997, "r_x2": 453.72305000000006, "r_y2": 271.05724999999995, "r_x3": 346.37601, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 308.86203, "t": 283.36325000000005, "r": 545.11511, "b": 387.91071, "coord_origin": "TOPLEFT" }, "confidence": 0.9562004804611206, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 292.26981, "r_x1": 328.38953, "r_y1": 292.26981, "r_x2": 328.38953, "r_y2": 283.36325000000005, "r_x3": 320.81702, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.9137, "r_y0": 292.26981, "r_x1": 545.11499, "r_y1": 292.26981, "r_x2": 545.11499, "r_y2": 283.36325000000005, "r_x3": 330.9137, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 304.22479, "r_x1": 545.11511, "r_y1": 304.22479, "r_x2": 545.11511, "r_y2": 295.31824, "r_x3": 308.86203, "r_y3": 295.31824, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 316.17978, "r_x1": 545.11505, "r_y1": 316.17978, "r_x2": 545.11505, "r_y2": 307.27322, "r_x3": 308.86203, "r_y3": 307.27322, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 328.13477, "r_x1": 545.11511, "r_y1": 328.13477, "r_x2": 545.11511, "r_y2": 319.22821000000005, "r_x3": 308.86203, "r_y3": 319.22821000000005, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 340.09076000000005, "r_x1": 397.19043, "r_y1": 340.09076000000005, "r_x2": 397.19043, "r_y2": 331.1842, "r_x3": 308.86203, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.65616, "r_y0": 340.09076000000005, "r_x1": 545.11511, "r_y1": 340.09076000000005, "r_x2": 545.11511, "r_y2": 331.1842, "r_x3": 403.65616, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 352.04575, "r_x1": 545.11511, "r_y1": 352.04575, "r_x2": 545.11511, "r_y2": 343.13919, "r_x3": 308.86203, "r_y3": 343.13919, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 364.00073, "r_x1": 545.11505, "r_y1": 364.00073, "r_x2": 545.11505, "r_y2": 355.09418, "r_x3": 308.86203, "r_y3": 355.09418, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 375.95572000000004, "r_x1": 545.11505, "r_y1": 375.95572000000004, "r_x2": 545.11505, "r_y2": 367.04916, "r_x3": 308.86203, "r_y3": 367.04916, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 387.91071, "r_x1": 329.61414, "r_y1": 387.91071, "r_x2": 329.61414, "r_y2": 379.00415, "r_x3": 308.86203, "r_y3": 379.00415, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "list_item", "bbox": { "l": 308.86203, "t": 391.31015, "r": 545.11517, "b": 459.99164, "coord_origin": "TOPLEFT" }, "confidence": 0.8719939589500427, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 400.2167099999999, "r_x1": 328.55356, "r_y1": 400.2167099999999, "r_x2": 328.55356, "r_y2": 391.31015, "r_x3": 320.81702, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13242, "r_y0": 400.2167099999999, "r_x1": 545.11505, "r_y1": 400.2167099999999, "r_x2": 545.11505, "r_y2": 391.31015, "r_x3": 331.13242, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 412.17169, "r_x1": 545.11517, "r_y1": 412.17169, "r_x2": 545.11517, "r_y2": 403.26514, "r_x3": 308.86203, "r_y3": 403.26514, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 424.12668, "r_x1": 545.11511, "r_y1": 424.12668, "r_x2": 545.11511, "r_y2": 415.22012000000007, "r_x3": 308.86203, "r_y3": 415.22012000000007, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 436.0816699999999, "r_x1": 545.11511, "r_y1": 436.0816699999999, "r_x2": 545.11511, "r_y2": 427.17511, "r_x3": 308.86203, "r_y3": 427.17511, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 448.03665, "r_x1": 545.11505, "r_y1": 448.03665, "r_x2": 545.11505, "r_y2": 439.1301, "r_x3": 308.86203, "r_y3": 439.1301, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 459.99164, "r_x1": 426.18161, "r_y1": 459.99164, "r_x2": 426.18161, "r_y2": 451.08507999999995, "r_x3": 308.86203, "r_y3": 451.08507999999995, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "list_item", "bbox": { "l": 308.86203, "t": 463.39108, "r": 545.11517, "b": 567.93858, "coord_origin": "TOPLEFT" }, "confidence": 0.9126082062721252, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 472.29764, "r_x1": 328.67316, "r_y1": 472.29764, "r_x2": 328.67316, "r_y2": 463.39108, "r_x3": 320.81702, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29187, "r_y0": 472.29764, "r_x1": 545.11499, "r_y1": 472.29764, "r_x2": 545.11499, "r_y2": 463.39108, "r_x3": 331.29187, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 484.25262, "r_x1": 545.11505, "r_y1": 484.25262, "r_x2": 545.11505, "r_y2": 475.34607, "r_x3": 308.86203, "r_y3": 475.34607, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 496.20761, "r_x1": 545.11517, "r_y1": 496.20761, "r_x2": 545.11517, "r_y2": 487.30106, "r_x3": 308.86203, "r_y3": 487.30106, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 508.1626, "r_x1": 381.89786, "r_y1": 508.1626, "r_x2": 381.89786, "r_y2": 499.25604, "r_x3": 308.86203, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7023, "r_y0": 508.1626, "r_x1": 545.11517, "r_y1": 508.1626, "r_x2": 545.11517, "r_y2": 499.25604, "r_x3": 388.7023, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 520.11859, "r_x1": 545.11511, "r_y1": 520.11859, "r_x2": 545.11511, "r_y2": 511.21204, "r_x3": 308.86203, "r_y3": 511.21204, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 532.07358, "r_x1": 545.11505, "r_y1": 532.07358, "r_x2": 545.11505, "r_y2": 523.16702, "r_x3": 308.86203, "r_y3": 523.16702, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 544.02858, "r_x1": 545.11499, "r_y1": 544.02858, "r_x2": 545.11499, "r_y2": 535.12201, "r_x3": 308.86203, "r_y3": 535.12201, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 555.98358, "r_x1": 545.11517, "r_y1": 555.98358, "r_x2": 545.11517, "r_y2": 547.07703, "r_x3": 308.86203, "r_y3": 547.07703, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 567.93858, "r_x1": 442.22147000000007, "r_y1": 567.93858, "r_x2": 442.22147000000007, "r_y2": 559.03203, "r_x3": 308.86203, "r_y3": 559.03203, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 308.86203, "t": 571.33803, "r": 545.11688, "b": 604.15459, "coord_origin": "TOPLEFT" }, "confidence": 0.8459473848342896, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 580.24458, "r_x1": 545.11493, "r_y1": 580.24458, "r_x2": 545.11493, "r_y2": 571.33803, "r_x3": 320.81702, "r_y3": 571.33803, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 592.19958, "r_x1": 471.64093, "r_y1": 592.19958, "r_x2": 471.64093, "r_y2": 583.29303, "r_x3": 308.86203, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83405, "r_y0": 591.98041, "r_x1": 479.71872, "r_y1": 591.98041, "r_x2": 479.71872, "r_y2": 583.1336200000001, "r_x3": 474.83405, "r_y3": 583.1336200000001, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.26903999999996, "r_y0": 592.19958, "r_x1": 545.11688, "r_y1": 592.19958, "r_x2": 545.11688, "r_y2": 583.29303, "r_x3": 483.26903999999996, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 604.15459, "r_x1": 329.91306, "r_y1": 604.15459, "r_x2": 329.91306, "r_y2": 595.24803, "r_x3": 308.86206, "r_y3": 595.24803, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "list_item", "bbox": { "l": 308.86206, "t": 607.55304, "r": 545.11505, "b": 628.4155900000001, "coord_origin": "TOPLEFT" }, "confidence": 0.7716891169548035, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 616.4595899999999, "r_x1": 332.8718, "r_y1": 616.4595899999999, "r_x2": 332.8718, "r_y2": 607.55304, "r_x3": 320.81705, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.92532, "r_y0": 616.4595899999999, "r_x1": 545.11505, "r_y1": 616.4595899999999, "r_x2": 545.11505, "r_y2": 607.55304, "r_x3": 339.92532, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 628.4155900000001, "r_x1": 495.2923, "r_y1": 628.4155900000001, "r_x2": 495.2923, "r_y2": 619.50903, "r_x3": 308.86206, "r_y3": 619.50903, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 308.86206, "t": 631.81403, "r": 545.11505, "b": 664.63059, "coord_origin": "TOPLEFT" }, "confidence": 0.8584907054901123, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 640.72058, "r_x1": 545.11505, "r_y1": 640.72058, "r_x2": 545.11505, "r_y2": 631.81403, "r_x3": 320.81705, "r_y3": 631.81403, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 652.67558, "r_x1": 455.28238, "r_y1": 652.67558, "r_x2": 455.28238, "r_y2": 643.7690299999999, "r_x3": 308.86206, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.77704, "r_y0": 652.45641, "r_x1": 463.47067, "r_y1": 652.45641, "r_x2": 463.47067, "r_y2": 643.60962, "r_x3": 457.77704, "r_y3": 643.60962, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97104, "r_y0": 652.67558, "r_x1": 545.11389, "r_y1": 652.67558, "r_x2": 545.11389, "r_y2": 643.7690299999999, "r_x3": 465.97104, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 664.63059, "r_x1": 332.38376, "r_y1": 664.63059, "r_x2": 332.38376, "r_y2": 655.72403, "r_x3": 308.86206, "r_y3": 655.72403, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "list_item", "bbox": { "l": 308.86206, "t": 668.03003, "r": 545.11499, "b": 688.89159, "coord_origin": "TOPLEFT" }, "confidence": 0.7590745091438293, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 676.93659, "r_x1": 545.11499, "r_y1": 676.93659, "r_x2": 545.11499, "r_y2": 668.03003, "r_x3": 320.81705, "r_y3": 668.03003, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 688.89159, "r_x1": 510.5848700000001, "r_y1": 688.89159, "r_x2": 510.5848700000001, "r_y2": 679.98503, "r_x3": 308.86206, "r_y3": 679.98503, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "list_item", "bbox": { "l": 308.86206, "t": 692.290024, "r": 545.11517, "b": 713.151596, "coord_origin": "TOPLEFT" }, "confidence": 0.6971189975738525, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 701.196594, "r_x1": 545.11505, "r_y1": 701.196594, "r_x2": 545.11505, "r_y2": 692.290024, "r_x3": 320.81705, "r_y3": 692.290024, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 713.151596, "r_x1": 545.11517, "r_y1": 713.151596, "r_x2": 545.11517, "r_y2": 704.245026, "r_x3": 308.86206, "r_y3": 704.245026, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_footer", "bbox": { "l": 292.63107, "t": 734.13303, "r": 302.59366, "b": 743.039593, "coord_origin": "TOPLEFT" }, "confidence": 0.9126598238945007, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63107, "r_y0": 743.039593, "r_x1": 302.59366, "r_y1": 743.039593, "r_x2": 302.59366, "r_y2": 734.13303, "r_x3": 292.63107, "r_y3": 734.13303, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "picture", "id": 30, "page_no": 11, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT" }, "confidence": 0.6033818125724792, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39108, "r_y0": 83.25922000000003, "r_x1": 151.94641, "r_y1": 83.25922000000003, "r_x2": 151.94641, "r_y2": 77.31055000000003, "r_x3": 119.39108, "r_y3": 77.31055000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.345978, "r_y0": 81.14020000000005, "r_x1": 59.327053, "r_y1": 81.14020000000005, "r_x2": 59.327053, "r_y2": 75.19152999999994, "r_x3": 53.345978, "r_y3": 75.19152999999994, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.5791, "r_y0": 83.40698000000009, "r_x1": 319.8266, "r_y1": 83.40698000000009, "r_x2": 319.8266, "r_y2": 77.45830999999998, "r_x3": 289.5791, "r_y3": 77.45830999999998, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37271, "r_y0": 83.20263999999997, "r_x1": 481.75916, "r_y1": 83.20263999999997, "r_x2": 481.75916, "r_y2": 77.25396999999987, "r_x3": 448.37271, "r_y3": 77.25396999999987, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.553436, "r_y0": 146.23339999999996, "r_x1": 94.976013, "r_y1": 146.23339999999996, "r_x2": 94.976013, "r_y2": 141.27617999999995, "r_x3": 82.553436, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.03878399999999, "r_y0": 106.06133999999986, "r_x1": 85.290085, "r_y1": 106.06133999999986, "r_x2": 85.290085, "r_y2": 101.10413000000005, "r_x3": 63.03878399999999, "r_y3": 101.10413000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.76786, "r_y0": 129.35253999999998, "r_x1": 85.231277, "r_y1": 129.35253999999998, "r_x2": 85.231277, "r_y2": 124.39531999999997, "r_x3": 67.76786, "r_y3": 124.39531999999997, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55121, "r_y0": 107.49712999999997, "r_x1": 249.80251, "r_y1": 107.49712999999997, "r_x2": 249.80251, "r_y2": 102.53992000000005, "r_x3": 227.55121, "r_y3": 102.53992000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.19898999999998, "r_y0": 131.94299, "r_x1": 249.66241, "r_y1": 131.94299, "r_x2": 249.66241, "r_y2": 126.98577999999986, "r_x3": 232.19898999999998, "r_y3": 126.98577999999986, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2337, "r_y0": 119.00243999999998, "r_x1": 413.69711, "r_y1": 119.00243999999998, "r_x2": 413.69711, "r_y2": 114.04522999999995, "r_x3": 396.2337, "r_y3": 114.04522999999995, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.382202, "r_y0": 146.23339999999996, "r_x1": 105.08014, "r_y1": 146.23339999999996, "r_x2": 105.08014, "r_y2": 141.27617999999995, "r_x3": 97.382202, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.93763400000001, "r_y0": 90.69042999999999, "r_x1": 76.151443, "r_y1": 90.69042999999999, "r_x2": 76.151443, "r_y2": 85.73321999999996, "r_x3": 60.93763400000001, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.304901, "r_y0": 91.18073000000015, "r_x1": 106.99162, "r_y1": 91.18073000000015, "r_x2": 106.99162, "r_y2": 86.22351000000003, "r_x3": 82.304901, "r_y3": 86.22351000000003, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.20530999999997, "r_y0": 146.56329000000005, "r_x1": 281.88013, "r_y1": 146.56329000000005, "r_x2": 281.88013, "r_y2": 141.60608000000002, "r_x3": 246.20530999999997, "r_y3": 141.60608000000002, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.69780000000003, "r_y0": 90.69042999999999, "r_x1": 241.91161, "r_y1": 90.69042999999999, "r_x2": 241.91161, "r_y2": 85.73321999999996, "r_x3": 226.69780000000003, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.93848999999997, "r_y0": 91.04522999999995, "r_x1": 282.49384, "r_y1": 91.04522999999995, "r_x2": 282.49384, "r_y2": 86.08801000000005, "r_x3": 249.93848999999997, "r_y3": 86.08801000000005, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19409, "r_y0": 146.23339999999996, "r_x1": 444.68915, "r_y1": 146.23339999999996, "r_x2": 444.68915, "r_y2": 141.27617999999995, "r_x3": 410.19409, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37341, "r_y0": 90.69042999999999, "r_x1": 432.6716599999999, "r_y1": 90.69042999999999, "r_x2": 432.6716599999999, "r_y2": 85.73321999999996, "r_x3": 391.37341, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.60571000000004, "r_y0": 91.21862999999996, "r_x1": 445.62414999999993, "r_y1": 91.21862999999996, "r_x2": 445.62414999999993, "r_y2": 86.26140999999996, "r_x3": 435.60571000000004, "r_y3": 86.26140999999996, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.94921, "r_y0": 146.24567000000002, "r_x1": 136.20052, "r_y1": 146.24567000000002, "r_x2": 136.20052, "r_y2": 141.28845, "r_x3": 113.94921, "r_y3": 141.28845, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.91554000000001, "r_y0": 99.77575999999999, "r_x1": 127.05433999999998, "r_y1": 99.77575999999999, "r_x2": 127.05433999999998, "r_y2": 94.81853999999998, "r_x3": 116.91554000000001, "r_y3": 94.81853999999998, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.3146, "r_y0": 105.89575000000002, "r_x1": 127.05298, "r_y1": 105.89575000000002, "r_x2": 127.05298, "r_y2": 100.93853999999999, "r_x3": 113.3146, "r_y3": 100.93853999999999, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94112, "r_y0": 112.01575000000003, "r_x1": 127.05537, "r_y1": 112.01575000000003, "r_x2": 127.05537, "r_y2": 107.05853000000013, "r_x3": 112.94112, "r_y3": 107.05853000000013, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.22738999999999, "r_y0": 127.57245, "r_x1": 126.96577, "r_y1": 127.57245, "r_x2": 126.96577, "r_y2": 122.61523, "r_x3": 113.22738999999999, "r_y3": 122.61523, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85390000000001, "r_y0": 133.69244000000003, "r_x1": 126.96814999999998, "r_y1": 133.69244000000003, "r_x2": 126.96814999999998, "r_y2": 128.73523, "r_x3": 112.85390000000001, "r_y3": 128.73523, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.57864, "r_y0": 146.39362000000006, "r_x1": 156.04207, "r_y1": 146.39362000000006, "r_x2": 156.04207, "r_y2": 141.43640000000005, "r_x3": 138.57864, "r_y3": 141.43640000000005, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03101, "r_y0": 91.22852, "r_x1": 151.04185, "r_y1": 91.22852, "r_x2": 151.04185, "r_y2": 86.2713, "r_x3": 122.03101, "r_y3": 86.2713, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65359, "r_y0": 91.5122100000001, "r_x1": 321.67203, "r_y1": 91.5122100000001, "r_x2": 321.67203, "r_y2": 86.55498999999998, "r_x3": 311.65359, "r_y3": 86.55498999999998, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89441, "r_y0": 146.66785000000004, "r_x1": 310.14572, "r_y1": 146.66785000000004, "r_x2": 310.14572, "r_y2": 141.71063000000004, "r_x3": 287.89441, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.23572, "r_y0": 98.03698999999995, "r_x1": 299.37451, "r_y1": 98.03698999999995, "r_x2": 299.37451, "r_y2": 93.07977000000005, "r_x3": 289.23572, "r_y3": 93.07977000000005, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63513, "r_y0": 104.15698000000009, "r_x1": 299.3735, "r_y1": 104.15698000000009, "r_x2": 299.3735, "r_y2": 99.19976999999994, "r_x3": 285.63513, "r_y3": 99.19976999999994, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26111, "r_y0": 110.27697999999998, "r_x1": 299.37537, "r_y1": 110.27697999999998, "r_x2": 299.37537, "r_y2": 105.31975999999997, "r_x3": 285.26111, "r_y3": 105.31975999999997, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43109, "r_y0": 125.34717, "r_x1": 299.16946, "r_y1": 125.34717, "r_x2": 299.16946, "r_y2": 120.38995, "r_x3": 285.43109, "r_y3": 120.38995, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.05713, "r_y0": 131.46716000000004, "r_x1": 299.17139, "r_y1": 131.46716000000004, "r_x2": 299.17139, "r_y2": 126.50995, "r_x3": 285.05713, "r_y3": 126.50995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.34592, "r_y0": 146.66785000000004, "r_x1": 328.80933, "r_y1": 146.66785000000004, "r_x2": 328.80933, "r_y2": 141.71063000000004, "r_x3": 311.34592, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58362, "r_y0": 91.65075999999999, "r_x1": 309.60205, "r_y1": 91.65075999999999, "r_x2": 309.60205, "r_y2": 86.69353999999998, "r_x3": 299.58362, "r_y3": 86.69353999999998, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04077000000007, "r_y0": 146.62891000000002, "r_x1": 483.50418, "r_y1": 146.62891000000002, "r_x2": 483.50418, "r_y2": 141.67169, "r_x3": 466.04077000000007, "r_y3": 141.67169, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02151, "r_y0": 98.71838000000002, "r_x1": 469.16031000000004, "r_y1": 98.71838000000002, "r_x2": 469.16031000000004, "r_y2": 93.76116999999999, "r_x3": 459.02151, "r_y3": 93.76116999999999, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.4209, "r_y0": 104.83838000000003, "r_x1": 469.15927000000005, "r_y1": 104.83838000000003, "r_x2": 469.15927000000005, "r_y2": 99.88116000000002, "r_x3": 455.4209, "r_y3": 99.88116000000002, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.04691, "r_y0": 110.95836999999995, "r_x1": 469.16115999999994, "r_y1": 110.95836999999995, "r_x2": 469.16115999999994, "r_y2": 106.00116000000014, "r_x3": 455.04691, "r_y3": 106.00116000000014, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39401, "r_y0": 90.52959999999996, "r_x1": 480.6545100000001, "r_y1": 90.52959999999996, "r_x2": 480.6545100000001, "r_y2": 85.57239000000004, "r_x3": 467.39401, "r_y3": 85.57239000000004, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37672, "r_y0": 146.54107999999997, "r_x1": 182.62802, "r_y1": 146.54107999999997, "r_x2": 182.62802, "r_y2": 141.58385999999996, "r_x3": 160.37672, "r_y3": 141.58385999999996, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74265, "r_y0": 99.82201999999995, "r_x1": 173.32664, "r_y1": 99.82201999999995, "r_x2": 173.32664, "r_y2": 94.86481000000003, "r_x3": 153.74265, "r_y3": 94.86481000000003, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50967, "r_y0": 105.94202000000007, "r_x1": 173.3246, "r_y1": 105.94202000000007, "r_x2": 173.3246, "r_y2": 100.98479999999995, "r_x3": 154.50967, "r_y3": 100.98479999999995, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27162, "r_y0": 112.06200999999987, "r_x1": 173.32664, "r_y1": 112.06200999999987, "r_x2": 173.32664, "r_y2": 107.10479999999995, "r_x3": 155.27162, "r_y3": 107.10479999999995, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41302, "r_y0": 112.18970000000002, "r_x1": 345.99701, "r_y1": 112.18970000000002, "r_x2": 345.99701, "r_y2": 107.23248000000001, "r_x3": 326.41302, "r_y3": 107.23248000000001, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.17972, "r_y0": 118.30969000000005, "r_x1": 345.99463, "r_y1": 118.30969000000005, "r_x2": 345.99463, "r_y2": 113.35248000000001, "r_x3": 327.17972, "r_y3": 113.35248000000001, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94131, "r_y0": 124.42969000000005, "r_x1": 345.99634, "r_y1": 124.42969000000005, "r_x2": 345.99634, "r_y2": 119.47247000000004, "r_x3": 327.94131, "r_y3": 119.47247000000004, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.9942, "r_y0": 109.11095999999998, "r_x1": 508.76384999999993, "r_y1": 109.11095999999998, "r_x2": 508.76384999999993, "r_y2": 104.15374999999983, "r_x3": 488.9942, "r_y3": 104.15374999999983, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.1893, "r_y0": 115.2309600000001, "r_x1": 508.76349000000005, "r_y1": 115.2309600000001, "r_x2": 508.76349000000005, "r_y2": 110.27373999999998, "r_x3": 490.1893, "r_y3": 110.27373999999998, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72009, "r_y0": 121.35095000000013, "r_x1": 508.76758, "r_y1": 121.35095000000013, "r_x2": 508.76758, "r_y2": 116.39373999999998, "r_x3": 489.72009, "r_y3": 116.39373999999998, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71121, "r_y0": 127.47095000000002, "r_x1": 508.76624, "r_y1": 127.47095000000002, "r_x2": 508.76624, "r_y2": 122.51373000000001, "r_x3": 490.71121, "r_y3": 122.51373000000001, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.37759, "r_y0": 146.66840000000002, "r_x1": 202.84102, "r_y1": 146.66840000000002, "r_x2": 202.84102, "r_y2": 141.71118, "r_x3": 185.37759, "r_y3": 141.71118, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.50357, "r_y0": 91.09331999999995, "r_x1": 197.52699, "r_y1": 91.09331999999995, "r_x2": 197.52699, "r_y2": 86.13611000000003, "r_x3": 168.50357, "r_y3": 86.13611000000003, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.3768, "r_y0": 90.95428000000004, "r_x1": 367.39523, "r_y1": 90.95428000000004, "r_x2": 367.39523, "r_y2": 85.99707000000001, "r_x3": 357.3768, "r_y3": 85.99707000000001, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73151, "r_y0": 146.58043999999995, "r_x1": 374.92862, "r_y1": 146.58043999999995, "r_x2": 374.92862, "r_y2": 141.62323000000004, "r_x3": 333.73151, "r_y3": 141.62323000000004, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69101, "r_y0": 91.01312000000007, "r_x1": 355.70944, "r_y1": 91.01312000000007, "r_x2": 355.70944, "r_y2": 86.05591000000004, "r_x3": 345.69101, "r_y3": 86.05591000000004, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54248, "r_y0": 146.33405000000005, "r_x1": 526.00592, "r_y1": 146.33405000000005, "r_x2": 526.00592, "r_y2": 141.37683000000004, "r_x3": 508.54248, "r_y3": 141.37683000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.44653000000005, "r_y0": 91.0498, "r_x1": 523.70703, "r_y1": 91.0498, "r_x2": 523.70703, "r_y2": 86.09258999999986, "r_x3": 510.44653000000005, "r_y3": 86.09258999999986, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 46, "label": "text", "bbox": { "l": 119.39108, "t": 77.31055000000003, "r": 151.94641, "b": 83.25922000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39108, "r_y0": 83.25922000000003, "r_x1": 151.94641, "r_y1": 83.25922000000003, "r_x2": 151.94641, "r_y2": 77.31055000000003, "r_x3": 119.39108, "r_y3": 77.31055000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 53.345978, "t": 75.19152999999994, "r": 59.327053, "b": 81.14020000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.345978, "r_y0": 81.14020000000005, "r_x1": 59.327053, "r_y1": 81.14020000000005, "r_x2": 59.327053, "r_y2": 75.19152999999994, "r_x3": 53.345978, "r_y3": 75.19152999999994, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 289.5791, "t": 77.45830999999998, "r": 319.8266, "b": 83.40698000000009, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.5791, "r_y0": 83.40698000000009, "r_x1": 319.8266, "r_y1": 83.40698000000009, "r_x2": 319.8266, "r_y2": 77.45830999999998, "r_x3": 289.5791, "r_y3": 77.45830999999998, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 448.37271, "t": 77.25396999999987, "r": 481.75916, "b": 83.20263999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37271, "r_y0": 83.20263999999997, "r_x1": 481.75916, "r_y1": 83.20263999999997, "r_x2": 481.75916, "r_y2": 77.25396999999987, "r_x3": 448.37271, "r_y3": 77.25396999999987, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 82.553436, "t": 141.27617999999995, "r": 94.976013, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.553436, "r_y0": 146.23339999999996, "r_x1": 94.976013, "r_y1": 146.23339999999996, "r_x2": 94.976013, "r_y2": 141.27617999999995, "r_x3": 82.553436, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 63.03878399999999, "t": 101.10413000000005, "r": 85.290085, "b": 106.06133999999986, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.03878399999999, "r_y0": 106.06133999999986, "r_x1": 85.290085, "r_y1": 106.06133999999986, "r_x2": 85.290085, "r_y2": 101.10413000000005, "r_x3": 63.03878399999999, "r_y3": 101.10413000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 67.76786, "t": 124.39531999999997, "r": 85.231277, "b": 129.35253999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.76786, "r_y0": 129.35253999999998, "r_x1": 85.231277, "r_y1": 129.35253999999998, "r_x2": 85.231277, "r_y2": 124.39531999999997, "r_x3": 67.76786, "r_y3": 124.39531999999997, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 227.55121, "t": 102.53992000000005, "r": 249.80251, "b": 107.49712999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55121, "r_y0": 107.49712999999997, "r_x1": 249.80251, "r_y1": 107.49712999999997, "r_x2": 249.80251, "r_y2": 102.53992000000005, "r_x3": 227.55121, "r_y3": 102.53992000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 232.19898999999998, "t": 126.98577999999986, "r": 249.66241, "b": 131.94299, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.19898999999998, "r_y0": 131.94299, "r_x1": 249.66241, "r_y1": 131.94299, "r_x2": 249.66241, "r_y2": 126.98577999999986, "r_x3": 232.19898999999998, "r_y3": 126.98577999999986, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 396.2337, "t": 114.04522999999995, "r": 413.69711, "b": 119.00243999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2337, "r_y0": 119.00243999999998, "r_x1": 413.69711, "r_y1": 119.00243999999998, "r_x2": 413.69711, "r_y2": 114.04522999999995, "r_x3": 396.2337, "r_y3": 114.04522999999995, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 97.382202, "t": 141.27617999999995, "r": 105.08014, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.382202, "r_y0": 146.23339999999996, "r_x1": 105.08014, "r_y1": 146.23339999999996, "r_x2": 105.08014, "r_y2": 141.27617999999995, "r_x3": 97.382202, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 60.93763400000001, "t": 85.73321999999996, "r": 76.151443, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.93763400000001, "r_y0": 90.69042999999999, "r_x1": 76.151443, "r_y1": 90.69042999999999, "r_x2": 76.151443, "r_y2": 85.73321999999996, "r_x3": 60.93763400000001, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 82.304901, "t": 86.22351000000003, "r": 106.99162, "b": 91.18073000000015, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.304901, "r_y0": 91.18073000000015, "r_x1": 106.99162, "r_y1": 91.18073000000015, "r_x2": 106.99162, "r_y2": 86.22351000000003, "r_x3": 82.304901, "r_y3": 86.22351000000003, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 246.20530999999997, "t": 141.60608000000002, "r": 281.88013, "b": 146.56329000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.20530999999997, "r_y0": 146.56329000000005, "r_x1": 281.88013, "r_y1": 146.56329000000005, "r_x2": 281.88013, "r_y2": 141.60608000000002, "r_x3": 246.20530999999997, "r_y3": 141.60608000000002, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 226.69780000000003, "t": 85.73321999999996, "r": 241.91161, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.69780000000003, "r_y0": 90.69042999999999, "r_x1": 241.91161, "r_y1": 90.69042999999999, "r_x2": 241.91161, "r_y2": 85.73321999999996, "r_x3": 226.69780000000003, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 249.93848999999997, "t": 86.08801000000005, "r": 282.49384, "b": 91.04522999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.93848999999997, "r_y0": 91.04522999999995, "r_x1": 282.49384, "r_y1": 91.04522999999995, "r_x2": 282.49384, "r_y2": 86.08801000000005, "r_x3": 249.93848999999997, "r_y3": 86.08801000000005, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 410.19409, "t": 141.27617999999995, "r": 444.68915, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19409, "r_y0": 146.23339999999996, "r_x1": 444.68915, "r_y1": 146.23339999999996, "r_x2": 444.68915, "r_y2": 141.27617999999995, "r_x3": 410.19409, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 391.37341, "t": 85.73321999999996, "r": 432.6716599999999, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37341, "r_y0": 90.69042999999999, "r_x1": 432.6716599999999, "r_y1": 90.69042999999999, "r_x2": 432.6716599999999, "r_y2": 85.73321999999996, "r_x3": 391.37341, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 435.60571000000004, "t": 86.26140999999996, "r": 445.62414999999993, "b": 91.21862999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.60571000000004, "r_y0": 91.21862999999996, "r_x1": 445.62414999999993, "r_y1": 91.21862999999996, "r_x2": 445.62414999999993, "r_y2": 86.26140999999996, "r_x3": 435.60571000000004, "r_y3": 86.26140999999996, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 113.94921, "t": 141.28845, "r": 136.20052, "b": 146.24567000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.94921, "r_y0": 146.24567000000002, "r_x1": 136.20052, "r_y1": 146.24567000000002, "r_x2": 136.20052, "r_y2": 141.28845, "r_x3": 113.94921, "r_y3": 141.28845, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 116.91554000000001, "t": 94.81853999999998, "r": 127.05433999999998, "b": 99.77575999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.91554000000001, "r_y0": 99.77575999999999, "r_x1": 127.05433999999998, "r_y1": 99.77575999999999, "r_x2": 127.05433999999998, "r_y2": 94.81853999999998, "r_x3": 116.91554000000001, "r_y3": 94.81853999999998, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 113.3146, "t": 100.93853999999999, "r": 127.05298, "b": 105.89575000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.3146, "r_y0": 105.89575000000002, "r_x1": 127.05298, "r_y1": 105.89575000000002, "r_x2": 127.05298, "r_y2": 100.93853999999999, "r_x3": 113.3146, "r_y3": 100.93853999999999, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 112.94112, "t": 107.05853000000013, "r": 127.05537, "b": 112.01575000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94112, "r_y0": 112.01575000000003, "r_x1": 127.05537, "r_y1": 112.01575000000003, "r_x2": 127.05537, "r_y2": 107.05853000000013, "r_x3": 112.94112, "r_y3": 107.05853000000013, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 113.22738999999999, "t": 122.61523, "r": 126.96577, "b": 127.57245, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.22738999999999, "r_y0": 127.57245, "r_x1": 126.96577, "r_y1": 127.57245, "r_x2": 126.96577, "r_y2": 122.61523, "r_x3": 113.22738999999999, "r_y3": 122.61523, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 112.85390000000001, "t": 128.73523, "r": 126.96814999999998, "b": 133.69244000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85390000000001, "r_y0": 133.69244000000003, "r_x1": 126.96814999999998, "r_y1": 133.69244000000003, "r_x2": 126.96814999999998, "r_y2": 128.73523, "r_x3": 112.85390000000001, "r_y3": 128.73523, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 138.57864, "t": 141.43640000000005, "r": 156.04207, "b": 146.39362000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.57864, "r_y0": 146.39362000000006, "r_x1": 156.04207, "r_y1": 146.39362000000006, "r_x2": 156.04207, "r_y2": 141.43640000000005, "r_x3": 138.57864, "r_y3": 141.43640000000005, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 122.03101, "t": 86.2713, "r": 151.04185, "b": 91.22852, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03101, "r_y0": 91.22852, "r_x1": 151.04185, "r_y1": 91.22852, "r_x2": 151.04185, "r_y2": 86.2713, "r_x3": 122.03101, "r_y3": 86.2713, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 311.65359, "t": 86.55498999999998, "r": 321.67203, "b": 91.5122100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65359, "r_y0": 91.5122100000001, "r_x1": 321.67203, "r_y1": 91.5122100000001, "r_x2": 321.67203, "r_y2": 86.55498999999998, "r_x3": 311.65359, "r_y3": 86.55498999999998, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 287.89441, "t": 141.71063000000004, "r": 310.14572, "b": 146.66785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89441, "r_y0": 146.66785000000004, "r_x1": 310.14572, "r_y1": 146.66785000000004, "r_x2": 310.14572, "r_y2": 141.71063000000004, "r_x3": 287.89441, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.23572, "t": 93.07977000000005, "r": 299.37451, "b": 98.03698999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.23572, "r_y0": 98.03698999999995, "r_x1": 299.37451, "r_y1": 98.03698999999995, "r_x2": 299.37451, "r_y2": 93.07977000000005, "r_x3": 289.23572, "r_y3": 93.07977000000005, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 285.63513, "t": 99.19976999999994, "r": 299.3735, "b": 104.15698000000009, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63513, "r_y0": 104.15698000000009, "r_x1": 299.3735, "r_y1": 104.15698000000009, "r_x2": 299.3735, "r_y2": 99.19976999999994, "r_x3": 285.63513, "r_y3": 99.19976999999994, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 285.26111, "t": 105.31975999999997, "r": 299.37537, "b": 110.27697999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26111, "r_y0": 110.27697999999998, "r_x1": 299.37537, "r_y1": 110.27697999999998, "r_x2": 299.37537, "r_y2": 105.31975999999997, "r_x3": 285.26111, "r_y3": 105.31975999999997, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 285.43109, "t": 120.38995, "r": 299.16946, "b": 125.34717, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43109, "r_y0": 125.34717, "r_x1": 299.16946, "r_y1": 125.34717, "r_x2": 299.16946, "r_y2": 120.38995, "r_x3": 285.43109, "r_y3": 120.38995, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 285.05713, "t": 126.50995, "r": 299.17139, "b": 131.46716000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.05713, "r_y0": 131.46716000000004, "r_x1": 299.17139, "r_y1": 131.46716000000004, "r_x2": 299.17139, "r_y2": 126.50995, "r_x3": 285.05713, "r_y3": 126.50995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 311.34592, "t": 141.71063000000004, "r": 328.80933, "b": 146.66785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.34592, "r_y0": 146.66785000000004, "r_x1": 328.80933, "r_y1": 146.66785000000004, "r_x2": 328.80933, "r_y2": 141.71063000000004, "r_x3": 311.34592, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 299.58362, "t": 86.69353999999998, "r": 309.60205, "b": 91.65075999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58362, "r_y0": 91.65075999999999, "r_x1": 309.60205, "r_y1": 91.65075999999999, "r_x2": 309.60205, "r_y2": 86.69353999999998, "r_x3": 299.58362, "r_y3": 86.69353999999998, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 466.04077000000007, "t": 141.67169, "r": 483.50418, "b": 146.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04077000000007, "r_y0": 146.62891000000002, "r_x1": 483.50418, "r_y1": 146.62891000000002, "r_x2": 483.50418, "r_y2": 141.67169, "r_x3": 466.04077000000007, "r_y3": 141.67169, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 459.02151, "t": 93.76116999999999, "r": 469.16031000000004, "b": 98.71838000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02151, "r_y0": 98.71838000000002, "r_x1": 469.16031000000004, "r_y1": 98.71838000000002, "r_x2": 469.16031000000004, "r_y2": 93.76116999999999, "r_x3": 459.02151, "r_y3": 93.76116999999999, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 455.4209, "t": 99.88116000000002, "r": 469.15927000000005, "b": 104.83838000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.4209, "r_y0": 104.83838000000003, "r_x1": 469.15927000000005, "r_y1": 104.83838000000003, "r_x2": 469.15927000000005, "r_y2": 99.88116000000002, "r_x3": 455.4209, "r_y3": 99.88116000000002, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 455.04691, "t": 106.00116000000014, "r": 469.16115999999994, "b": 110.95836999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.04691, "r_y0": 110.95836999999995, "r_x1": 469.16115999999994, "r_y1": 110.95836999999995, "r_x2": 469.16115999999994, "r_y2": 106.00116000000014, "r_x3": 455.04691, "r_y3": 106.00116000000014, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 467.39401, "t": 85.57239000000004, "r": 480.6545100000001, "b": 90.52959999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39401, "r_y0": 90.52959999999996, "r_x1": 480.6545100000001, "r_y1": 90.52959999999996, "r_x2": 480.6545100000001, "r_y2": 85.57239000000004, "r_x3": 467.39401, "r_y3": 85.57239000000004, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 160.37672, "t": 141.58385999999996, "r": 182.62802, "b": 146.54107999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37672, "r_y0": 146.54107999999997, "r_x1": 182.62802, "r_y1": 146.54107999999997, "r_x2": 182.62802, "r_y2": 141.58385999999996, "r_x3": 160.37672, "r_y3": 141.58385999999996, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 153.74265, "t": 94.86481000000003, "r": 173.32664, "b": 99.82201999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74265, "r_y0": 99.82201999999995, "r_x1": 173.32664, "r_y1": 99.82201999999995, "r_x2": 173.32664, "r_y2": 94.86481000000003, "r_x3": 153.74265, "r_y3": 94.86481000000003, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 154.50967, "t": 100.98479999999995, "r": 173.3246, "b": 105.94202000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50967, "r_y0": 105.94202000000007, "r_x1": 173.3246, "r_y1": 105.94202000000007, "r_x2": 173.3246, "r_y2": 100.98479999999995, "r_x3": 154.50967, "r_y3": 100.98479999999995, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 155.27162, "t": 107.10479999999995, "r": 173.32664, "b": 112.06200999999987, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27162, "r_y0": 112.06200999999987, "r_x1": 173.32664, "r_y1": 112.06200999999987, "r_x2": 173.32664, "r_y2": 107.10479999999995, "r_x3": 155.27162, "r_y3": 107.10479999999995, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.41302, "t": 107.23248000000001, "r": 345.99701, "b": 112.18970000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41302, "r_y0": 112.18970000000002, "r_x1": 345.99701, "r_y1": 112.18970000000002, "r_x2": 345.99701, "r_y2": 107.23248000000001, "r_x3": 326.41302, "r_y3": 107.23248000000001, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 327.17972, "t": 113.35248000000001, "r": 345.99463, "b": 118.30969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.17972, "r_y0": 118.30969000000005, "r_x1": 345.99463, "r_y1": 118.30969000000005, "r_x2": 345.99463, "r_y2": 113.35248000000001, "r_x3": 327.17972, "r_y3": 113.35248000000001, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 327.94131, "t": 119.47247000000004, "r": 345.99634, "b": 124.42969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94131, "r_y0": 124.42969000000005, "r_x1": 345.99634, "r_y1": 124.42969000000005, "r_x2": 345.99634, "r_y2": 119.47247000000004, "r_x3": 327.94131, "r_y3": 119.47247000000004, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 488.9942, "t": 104.15374999999983, "r": 508.76384999999993, "b": 109.11095999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.9942, "r_y0": 109.11095999999998, "r_x1": 508.76384999999993, "r_y1": 109.11095999999998, "r_x2": 508.76384999999993, "r_y2": 104.15374999999983, "r_x3": 488.9942, "r_y3": 104.15374999999983, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 490.1893, "t": 110.27373999999998, "r": 508.76349000000005, "b": 115.2309600000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.1893, "r_y0": 115.2309600000001, "r_x1": 508.76349000000005, "r_y1": 115.2309600000001, "r_x2": 508.76349000000005, "r_y2": 110.27373999999998, "r_x3": 490.1893, "r_y3": 110.27373999999998, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 489.72009, "t": 116.39373999999998, "r": 508.76758, "b": 121.35095000000013, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72009, "r_y0": 121.35095000000013, "r_x1": 508.76758, "r_y1": 121.35095000000013, "r_x2": 508.76758, "r_y2": 116.39373999999998, "r_x3": 489.72009, "r_y3": 116.39373999999998, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 490.71121, "t": 122.51373000000001, "r": 508.76624, "b": 127.47095000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71121, "r_y0": 127.47095000000002, "r_x1": 508.76624, "r_y1": 127.47095000000002, "r_x2": 508.76624, "r_y2": 122.51373000000001, "r_x3": 490.71121, "r_y3": 122.51373000000001, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 185.37759, "t": 141.71118, "r": 202.84102, "b": 146.66840000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.37759, "r_y0": 146.66840000000002, "r_x1": 202.84102, "r_y1": 146.66840000000002, "r_x2": 202.84102, "r_y2": 141.71118, "r_x3": 185.37759, "r_y3": 141.71118, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 168.50357, "t": 86.13611000000003, "r": 197.52699, "b": 91.09331999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.50357, "r_y0": 91.09331999999995, "r_x1": 197.52699, "r_y1": 91.09331999999995, "r_x2": 197.52699, "r_y2": 86.13611000000003, "r_x3": 168.50357, "r_y3": 86.13611000000003, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 357.3768, "t": 85.99707000000001, "r": 367.39523, "b": 90.95428000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.3768, "r_y0": 90.95428000000004, "r_x1": 367.39523, "r_y1": 90.95428000000004, "r_x2": 367.39523, "r_y2": 85.99707000000001, "r_x3": 357.3768, "r_y3": 85.99707000000001, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 333.73151, "t": 141.62323000000004, "r": 374.92862, "b": 146.58043999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73151, "r_y0": 146.58043999999995, "r_x1": 374.92862, "r_y1": 146.58043999999995, "r_x2": 374.92862, "r_y2": 141.62323000000004, "r_x3": 333.73151, "r_y3": 141.62323000000004, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 345.69101, "t": 86.05591000000004, "r": 355.70944, "b": 91.01312000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69101, "r_y0": 91.01312000000007, "r_x1": 355.70944, "r_y1": 91.01312000000007, "r_x2": 355.70944, "r_y2": 86.05591000000004, "r_x3": 345.69101, "r_y3": 86.05591000000004, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 508.54248, "t": 141.37683000000004, "r": 526.00592, "b": 146.33405000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54248, "r_y0": 146.33405000000005, "r_x1": 526.00592, "r_y1": 146.33405000000005, "r_x2": 526.00592, "r_y2": 141.37683000000004, "r_x3": 508.54248, "r_y3": 141.37683000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 510.44653000000005, "t": 86.09258999999986, "r": 523.70703, "b": 91.0498, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.44653000000005, "r_y0": 91.0498, "r_x1": 523.70703, "r_y1": 91.0498, "r_x2": 523.70703, "r_y2": 86.09258999999986, "r_x3": 510.44653000000005, "r_y3": 86.09258999999986, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 50.112, "t": 165.50238000000002, "r": 545.11371, "b": 186.36395000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9661495685577393, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 174.40894000000003, "r_x1": 545.11371, "r_y1": 174.40894000000003, "r_x2": 545.11371, "r_y2": 165.50238000000002, "r_x3": 50.112, "r_y3": 165.50238000000002, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 186.36395000000005, "r_x1": 513.52234, "r_y1": 186.36395000000005, "r_x2": 513.52234, "r_y2": 177.4574, "r_x3": 50.112, "r_y3": 177.4574, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity." }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 61.569, "t": 210.93140000000005, "r": 286.36511, "b": 231.79296999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9621952772140503, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 219.83794999999998, "r_x1": 71.14743, "r_y1": 219.83794999999998, "r_x2": 71.14743, "r_y2": 210.93140000000005, "r_x3": 61.569, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.542038, "r_y0": 219.83794999999998, "r_x1": 286.36511, "r_y1": 219.83794999999998, "r_x2": 286.36511, "r_y2": 210.93140000000005, "r_x3": 73.542038, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 231.79296999999997, "r_x1": 87.47155, "r_y1": 231.79296999999997, "r_x2": 87.47155, "r_y2": 222.88640999999996, "r_x3": 70.037003, "r_y3": 222.88640999999996, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 TableFormer output does not include the table cell content." }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 61.569, "t": 244.07141000000001, "r": 286.36514, "b": 264.93298000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9629555344581604, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 252.97797000000003, "r_x1": 71.345718, "r_y1": 252.97797000000003, "r_x2": 71.345718, "r_y2": 244.07141000000001, "r_x3": 61.569, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.789902, "r_y0": 252.97797000000003, "r_x1": 286.36514, "r_y1": 252.97797000000003, "r_x2": 286.36514, "r_y2": 244.07141000000001, "r_x3": 73.789902, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 264.93298000000004, "r_x1": 150.41524, "r_y1": 264.93298000000004, "r_x2": 150.41524, "r_y2": 256.02643, "r_x3": 70.037003, "r_y3": 256.02643, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.112, "t": 279.20343, "r": 286.36511, "b": 395.70688, "coord_origin": "TOPLEFT" }, "confidence": 0.9767085909843445, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 288.10999, "r_x1": 286.36499, "r_y1": 288.10999, "r_x2": 286.36499, "r_y2": 279.20343, "r_x3": 62.067001, "r_y3": 279.20343, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.06497, "r_x1": 286.36505, "r_y1": 300.06497, "r_x2": 286.36505, "r_y2": 291.15842, "r_x3": 50.112, "r_y3": 291.15842, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.01996, "r_x1": 286.36511, "r_y1": 312.01996, "r_x2": 286.36511, "r_y2": 303.1134, "r_x3": 50.112, "r_y3": 303.1134, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 323.97495, "r_x1": 286.36511, "r_y1": 323.97495, "r_x2": 286.36511, "r_y2": 315.06839, "r_x3": 50.112, "r_y3": 315.06839, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 335.93093999999996, "r_x1": 286.36511, "r_y1": 335.93093999999996, "r_x2": 286.36511, "r_y2": 327.02438, "r_x3": 50.112, "r_y3": 327.02438, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 347.88593, "r_x1": 286.36505, "r_y1": 347.88593, "r_x2": 286.36505, "r_y2": 338.97937, "r_x3": 50.112, "r_y3": 338.97937, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.84091, "r_x1": 286.36508, "r_y1": 359.84091, "r_x2": 286.36508, "r_y2": 350.93436, "r_x3": 50.112, "r_y3": 350.93436, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.7959, "r_x1": 286.36511, "r_y1": 371.7959, "r_x2": 286.36511, "r_y2": 362.88934, "r_x3": 50.112, "r_y3": 362.88934, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 383.75089, "r_x1": 286.36508, "r_y1": 383.75089, "r_x2": 286.36508, "r_y2": 374.84433000000007, "r_x3": 50.112, "r_y3": 374.84433000000007, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 395.70688, "r_x1": 154.55988, "r_y1": 395.70688, "r_x2": 154.55988, "r_y2": 386.80032, "r_x3": 50.112, "r_y3": 386.80032, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes." }, { "label": "text", "id": 11, "page_no": 11, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.112, "t": 399.06934, "r": 286.36496, "b": 419.93188, "coord_origin": "TOPLEFT" }, "confidence": 0.934766411781311, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 407.97589, "r_x1": 286.36496, "r_y1": 407.97589, "r_x2": 286.36496, "r_y2": 399.06934, "r_x3": 62.067001, "r_y3": 399.06934, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 419.93188, "r_x1": 95.491638, "r_y1": 419.93188, "r_x2": 95.491638, "r_y2": 411.02533, "r_x3": 50.112, "r_y3": 411.02533, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Here is a step-by-step description of the prediction postprocessing:" }, { "label": "list_item", "id": 20, "page_no": 11, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 50.112, "t": 423.29532, "r": 286.36508, "b": 456.11185000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.8280702233314514, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 432.20187, "r_x1": 69.37281, "r_y1": 432.20187, "r_x2": 69.37281, "r_y2": 423.29532, "r_x3": 62.067001, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.808075, "r_y0": 432.20187, "r_x1": 286.36502, "r_y1": 432.20187, "r_x2": 286.36502, "r_y2": 423.29532, "r_x3": 71.808075, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 444.15686, "r_x1": 286.36508, "r_y1": 444.15686, "r_x2": 286.36508, "r_y2": 435.25031, "r_x3": 50.112, "r_y3": 435.25031, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 456.11185000000006, "r_x1": 274.50958, "r_y1": 456.11185000000006, "r_x2": 274.50958, "r_y2": 447.20529, "r_x3": 50.112, "r_y3": 447.20529, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure." }, { "label": "list_item", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.112, "t": 459.47528, "r": 286.36505, "b": 504.2468, "coord_origin": "TOPLEFT" }, "confidence": 0.9646760821342468, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 468.38184, "r_x1": 69.538948, "r_y1": 468.38184, "r_x2": 69.538948, "r_y2": 459.47528, "r_x3": 62.067001, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.429329, "r_y0": 468.38184, "r_x1": 286.36499, "r_y1": 468.38184, "r_x2": 286.36499, "r_y2": 459.47528, "r_x3": 77.429329, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 480.33682, "r_x1": 286.36505, "r_y1": 480.33682, "r_x2": 286.36505, "r_y2": 471.43027, "r_x3": 50.112, "r_y3": 471.43027, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.29181, "r_x1": 286.36505, "r_y1": 492.29181, "r_x2": 286.36505, "r_y2": 483.38525, "r_x3": 50.112, "r_y3": 483.38525, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 504.2468, "r_x1": 110.70452999999999, "r_y1": 504.2468, "r_x2": 110.70452999999999, "r_y2": 495.34024, "r_x3": 50.112, "r_y3": 495.34024, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches." }, { "label": "list_item", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.112, "t": 507.61023, "r": 286.36493, "b": 528.4727800000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9391399025917053, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 516.5167799999999, "r_x1": 69.863068, "r_y1": 516.5167799999999, "r_x2": 69.863068, "r_y2": 507.61023, "r_x3": 62.067001, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.461754, "r_y0": 516.5167799999999, "r_x1": 286.36493, "r_y1": 516.5167799999999, "r_x2": 286.36493, "r_y2": 507.61023, "r_x3": 72.461754, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 528.4727800000001, "r_x1": 226.0714, "r_y1": 528.4727800000001, "r_x2": 226.0714, "r_y2": 519.5662199999999, "r_x3": 50.112, "r_y3": 519.5662199999999, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones." }, { "label": "list_item", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.112, "t": 531.83521, "r": 286.36511, "b": 564.65277, "coord_origin": "TOPLEFT" }, "confidence": 0.9491708874702454, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 540.7417800000001, "r_x1": 286.36496, "r_y1": 540.7417800000001, "r_x2": 286.36496, "r_y2": 531.83521, "r_x3": 62.067001, "r_y3": 531.83521, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 552.69777, "r_x1": 286.36511, "r_y1": 552.69777, "r_x2": 286.36511, "r_y2": 543.79121, "r_x3": 50.112, "r_y3": 543.79121, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 564.65277, "r_x1": 114.03204, "r_y1": 564.65277, "r_x2": 114.03204, "r_y2": 555.74622, "r_x3": 50.112, "r_y3": 555.74622, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column." }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.112, "t": 568.01622, "r": 286.36508, "b": 600.83278, "coord_origin": "TOPLEFT" }, "confidence": 0.9587163329124451, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 576.92278, "r_x1": 69.538948, "r_y1": 576.92278, "r_x2": 69.538948, "r_y2": 568.01622, "r_x3": 62.067001, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.731949, "r_y0": 576.92278, "r_x1": 286.36502, "r_y1": 576.92278, "r_x2": 286.36502, "r_y2": 568.01622, "r_x3": 76.731949, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 588.87778, "r_x1": 286.36508, "r_y1": 588.87778, "r_x2": 286.36508, "r_y2": 579.97122, "r_x3": 50.112, "r_y3": 579.97122, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 600.83278, "r_x1": 278.70383, "r_y1": 600.83278, "r_x2": 278.70383, "r_y2": 591.9262200000001, "r_x3": 50.112, "r_y3": 591.9262200000001, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:" }, { "label": "formula", "id": 12, "page_no": 11, "cluster": { "id": 12, "label": "formula", "bbox": { "l": 110.70499, "t": 623.43591, "r": 286.3624, "b": 654.1056100000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9298412799835205, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.02799999999999, "r_y0": 632.84061, "r_x1": 157.9516, "r_y1": 632.84061, "r_x2": 157.9516, "r_y2": 623.99382, "r_x3": 112.02799999999999, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.715, "r_y0": 632.84061, "r_x1": 203.4964, "r_y1": 632.84061, "r_x2": 203.4964, "r_y2": 623.99382, "r_x3": 160.715, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58499, "r_y0": 640.17578, "r_x1": 189.14511, "r_y1": 640.17578, "r_x2": 189.14511, "r_y2": 633.98305, "r_x3": 185.58499, "r_y3": 633.98305, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.49899, "r_y0": 632.84061, "r_x1": 208.48029, "r_y1": 632.84061, "r_x2": 208.48029, "r_y2": 623.43591, "r_x3": 203.49899, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48099, "r_y0": 632.84061, "r_x1": 220.28911, "r_y1": 632.84061, "r_x2": 220.28911, "r_y2": 623.99382, "r_x3": 208.48099, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.78699, "r_y0": 632.84061, "r_x1": 225.76828, "r_y1": 632.84061, "r_x2": 225.76828, "r_y2": 623.43591, "r_x3": 220.78699, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.70499, "r_y0": 654.1056100000001, "r_x1": 122.51310999999998, "r_y1": 654.1056100000001, "r_x2": 122.51310999999998, "r_y2": 645.25882, "r_x3": 110.70499, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.77899000000001, "r_y0": 654.1056100000001, "r_x1": 133.52791, "r_y1": 654.1056100000001, "r_x2": 133.52791, "r_y2": 645.25882, "r_x3": 125.77899000000001, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.295, "r_y0": 654.1056100000001, "r_x1": 156.00201, "r_y1": 654.1056100000001, "r_x2": 156.00201, "r_y2": 645.25882, "r_x3": 136.295, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.00299, "r_y0": 654.1056100000001, "r_x1": 160.98428, "r_y1": 654.1056100000001, "r_x2": 160.98428, "r_y2": 644.70091, "r_x3": 156.00299, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98399, "r_y0": 654.1056100000001, "r_x1": 170.23811, "r_y1": 654.1056100000001, "r_x2": 170.23811, "r_y2": 645.25882, "r_x3": 160.98399, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.73599, "r_y0": 654.1056100000001, "r_x1": 185.6779, "r_y1": 654.1056100000001, "r_x2": 185.6779, "r_y2": 644.70091, "r_x3": 170.73599, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.894, "r_y0": 654.1056100000001, "r_x1": 206.05283, "r_y1": 654.1056100000001, "r_x2": 206.05283, "r_y2": 645.25882, "r_x3": 187.894, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.054, "r_y0": 654.1056100000001, "r_x1": 211.03529, "r_y1": 654.1056100000001, "r_x2": 211.03529, "r_y2": 644.70091, "r_x3": 206.054, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.035, "r_y0": 654.1056100000001, "r_x1": 220.28912, "r_y1": 654.1056100000001, "r_x2": 220.28912, "r_y2": 645.25882, "r_x3": 211.035, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.787, "r_y0": 654.1056100000001, "r_x1": 225.76829999999998, "r_y1": 654.1056100000001, "r_x2": 225.76829999999998, "r_y2": 644.70091, "r_x3": 220.787, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 643.79178, "r_x1": 286.3624, "r_y1": 643.79178, "r_x2": 286.3624, "r_y2": 634.88522, "r_x3": 274.746, "r_y3": 634.88522, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "alignment = arg min c { D$_{c}$ } D$_{c}$ = max { x$_{c}$ } \u2212 min { x$_{c}$ } (4)" }, { "label": "text", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.112, "t": 667.3479199999999, "r": 286.362, "b": 688.92679, "coord_origin": "TOPLEFT" }, "confidence": 0.9545555114746094, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 676.97179, "r_x1": 74.45063, "r_y1": 676.97179, "r_x2": 74.45063, "r_y2": 668.06522, "r_x3": 50.112, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.335999, "r_y0": 676.75261, "r_x1": 82.647812, "r_y1": 676.75261, "r_x2": 82.647812, "r_y2": 667.90582, "r_x3": 78.335999, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.532997, "r_y0": 676.97179, "r_x1": 123.63372, "r_y1": 676.97179, "r_x2": 123.63372, "r_y2": 668.06522, "r_x3": 86.532997, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.51899999999999, "r_y0": 676.75261, "r_x1": 132.50029, "r_y1": 676.75261, "r_x2": 132.50029, "r_y2": 667.3479199999999, "r_x3": 127.51899999999999, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.50099, "r_y0": 676.97179, "r_x1": 210.69743, "r_y1": 676.97179, "r_x2": 210.69743, "r_y2": 668.06522, "r_x3": 132.50099, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.69699, "r_y0": 676.75261, "r_x1": 215.67828, "r_y1": 676.75261, "r_x2": 215.67828, "r_y2": 667.3479199999999, "r_x3": 210.69699, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56299, "r_y0": 676.97179, "r_x1": 233.94897000000003, "r_y1": 676.97179, "r_x2": 233.94897000000003, "r_y2": 668.06522, "r_x3": 219.56299, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83499000000003, "r_y0": 676.75261, "r_x1": 247.08911, "r_y1": 676.75261, "r_x2": 247.08911, "r_y2": 667.90582, "r_x3": 237.83499000000003, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47299000000004, "r_y0": 676.97179, "r_x1": 286.362, "r_y1": 676.97179, "r_x2": 286.362, "r_y2": 668.06522, "r_x3": 251.47299000000004, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 688.92679, "r_x1": 205.88721, "r_y1": 688.92679, "r_x2": 205.88721, "r_y2": 680.02022, "r_x3": 50.112, "r_y3": 680.02022, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where c is one of { left, centroid, right } and x$_{c}$ is the xcoordinate for the corresponding point." }, { "label": "list_item", "id": 13, "page_no": 11, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.112, "t": 692.290222, "r": 286.36496, "b": 713.151787, "coord_origin": "TOPLEFT" }, "confidence": 0.9260510206222534, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 701.196785, "r_x1": 69.538948, "r_y1": 701.196785, "r_x2": 69.538948, "r_y2": 692.290222, "r_x3": 62.067001, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.273666, "r_y0": 701.196785, "r_x1": 286.36496, "r_y1": 701.196785, "r_x2": 286.36496, "r_y2": 692.290222, "r_x3": 76.273666, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.151787, "r_x1": 94.604973, "r_y1": 713.151787, "r_x2": 94.604973, "r_y2": 704.245224, "r_x3": 50.112, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.598999, "r_y0": 712.93261, "r_x1": 103.29263, "r_y1": 712.93261, "r_x2": 103.29263, "r_y2": 704.085815, "r_x3": 97.598999, "r_y3": 704.085815, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.292, "r_y0": 713.151787, "r_x1": 286.36481, "r_y1": 713.151787, "r_x2": 286.36481, "r_y2": 704.245224, "r_x3": 103.292, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-" }, { "label": "text", "id": 16, "page_no": 11, "cluster": { "id": 16, "label": "text", "bbox": { "l": 308.862, "t": 210.93120999999996, "r": 545.11517, "b": 255.7038, "coord_origin": "TOPLEFT" }, "confidence": 0.8942298889160156, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 219.83776999999998, "r_x1": 545.11517, "r_y1": 219.83776999999998, "r_x2": 545.11517, "r_y2": 210.93120999999996, "r_x3": 308.862, "r_y3": 210.93120999999996, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 231.79376000000002, "r_x1": 545.11511, "r_y1": 231.79376000000002, "r_x2": 545.11511, "r_y2": 222.88720999999998, "r_x3": 308.862, "r_y3": 222.88720999999998, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 243.74878, "r_x1": 545.11511, "r_y1": 243.74878, "r_x2": 545.11511, "r_y2": 234.84222, "r_x3": 308.862, "r_y3": 234.84222, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 255.7038, "r_x1": 339.57669, "r_y1": 255.7038, "r_x2": 339.57669, "r_y2": 246.79724, "r_x3": 308.862, "r_y3": 246.79724, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal." }, { "label": "list_item", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 259.10222999999996, "r": 545.11499, "b": 279.96380999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9423392415046692, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 268.00879, "r_x1": 328.28894, "r_y1": 268.00879, "r_x2": 328.28894, "r_y2": 259.10222999999996, "r_x3": 320.81699, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88419, "r_y0": 268.00879, "r_x1": 545.11499, "r_y1": 268.00879, "r_x2": 545.11499, "r_y2": 259.10222999999996, "r_x3": 334.88419, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 279.96380999999997, "r_x1": 338.19189, "r_y1": 279.96380999999997, "r_x2": 338.19189, "r_y2": 271.05724999999995, "r_x3": 308.862, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68201, "r_y0": 279.74463000000003, "r_x1": 346.37564, "r_y1": 279.74463000000003, "r_x2": 346.37564, "r_y2": 270.89783, "r_x3": 340.68201, "r_y3": 270.89783, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37601, "r_y0": 279.96380999999997, "r_x1": 453.72305000000006, "r_y1": 279.96380999999997, "r_x2": 453.72305000000006, "r_y2": 271.05724999999995, "r_x3": 346.37601, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes." }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86203, "t": 283.36325000000005, "r": 545.11511, "b": 387.91071, "coord_origin": "TOPLEFT" }, "confidence": 0.9562004804611206, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 292.26981, "r_x1": 328.38953, "r_y1": 292.26981, "r_x2": 328.38953, "r_y2": 283.36325000000005, "r_x3": 320.81702, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.9137, "r_y0": 292.26981, "r_x1": 545.11499, "r_y1": 292.26981, "r_x2": 545.11499, "r_y2": 283.36325000000005, "r_x3": 330.9137, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 304.22479, "r_x1": 545.11511, "r_y1": 304.22479, "r_x2": 545.11511, "r_y2": 295.31824, "r_x3": 308.86203, "r_y3": 295.31824, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 316.17978, "r_x1": 545.11505, "r_y1": 316.17978, "r_x2": 545.11505, "r_y2": 307.27322, "r_x3": 308.86203, "r_y3": 307.27322, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 328.13477, "r_x1": 545.11511, "r_y1": 328.13477, "r_x2": 545.11511, "r_y2": 319.22821000000005, "r_x3": 308.86203, "r_y3": 319.22821000000005, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 340.09076000000005, "r_x1": 397.19043, "r_y1": 340.09076000000005, "r_x2": 397.19043, "r_y2": 331.1842, "r_x3": 308.86203, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.65616, "r_y0": 340.09076000000005, "r_x1": 545.11511, "r_y1": 340.09076000000005, "r_x2": 545.11511, "r_y2": 331.1842, "r_x3": 403.65616, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 352.04575, "r_x1": 545.11511, "r_y1": 352.04575, "r_x2": 545.11511, "r_y2": 343.13919, "r_x3": 308.86203, "r_y3": 343.13919, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 364.00073, "r_x1": 545.11505, "r_y1": 364.00073, "r_x2": 545.11505, "r_y2": 355.09418, "r_x3": 308.86203, "r_y3": 355.09418, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 375.95572000000004, "r_x1": 545.11505, "r_y1": 375.95572000000004, "r_x2": 545.11505, "r_y2": 367.04916, "r_x3": 308.86203, "r_y3": 367.04916, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 387.91071, "r_x1": 329.61414, "r_y1": 387.91071, "r_x2": 329.61414, "r_y2": 379.00415, "r_x3": 308.86203, "r_y3": 379.00415, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells." }, { "label": "list_item", "id": 17, "page_no": 11, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 308.86203, "t": 391.31015, "r": 545.11517, "b": 459.99164, "coord_origin": "TOPLEFT" }, "confidence": 0.8719939589500427, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 400.2167099999999, "r_x1": 328.55356, "r_y1": 400.2167099999999, "r_x2": 328.55356, "r_y2": 391.31015, "r_x3": 320.81702, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13242, "r_y0": 400.2167099999999, "r_x1": 545.11505, "r_y1": 400.2167099999999, "r_x2": 545.11505, "r_y2": 391.31015, "r_x3": 331.13242, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 412.17169, "r_x1": 545.11517, "r_y1": 412.17169, "r_x2": 545.11517, "r_y2": 403.26514, "r_x3": 308.86203, "r_y3": 403.26514, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 424.12668, "r_x1": 545.11511, "r_y1": 424.12668, "r_x2": 545.11511, "r_y2": 415.22012000000007, "r_x3": 308.86203, "r_y3": 415.22012000000007, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 436.0816699999999, "r_x1": 545.11511, "r_y1": 436.0816699999999, "r_x2": 545.11511, "r_y2": 427.17511, "r_x3": 308.86203, "r_y3": 427.17511, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 448.03665, "r_x1": 545.11505, "r_y1": 448.03665, "r_x2": 545.11505, "r_y2": 439.1301, "r_x3": 308.86203, "r_y3": 439.1301, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 459.99164, "r_x1": 426.18161, "r_y1": 459.99164, "r_x2": 426.18161, "r_y2": 451.08507999999995, "r_x3": 308.86203, "r_y3": 451.08507999999995, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score." }, { "label": "list_item", "id": 15, "page_no": 11, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.86203, "t": 463.39108, "r": 545.11517, "b": 567.93858, "coord_origin": "TOPLEFT" }, "confidence": 0.9126082062721252, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 472.29764, "r_x1": 328.67316, "r_y1": 472.29764, "r_x2": 328.67316, "r_y2": 463.39108, "r_x3": 320.81702, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29187, "r_y0": 472.29764, "r_x1": 545.11499, "r_y1": 472.29764, "r_x2": 545.11499, "r_y2": 463.39108, "r_x3": 331.29187, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 484.25262, "r_x1": 545.11505, "r_y1": 484.25262, "r_x2": 545.11505, "r_y2": 475.34607, "r_x3": 308.86203, "r_y3": 475.34607, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 496.20761, "r_x1": 545.11517, "r_y1": 496.20761, "r_x2": 545.11517, "r_y2": 487.30106, "r_x3": 308.86203, "r_y3": 487.30106, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 508.1626, "r_x1": 381.89786, "r_y1": 508.1626, "r_x2": 381.89786, "r_y2": 499.25604, "r_x3": 308.86203, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7023, "r_y0": 508.1626, "r_x1": 545.11517, "r_y1": 508.1626, "r_x2": 545.11517, "r_y2": 499.25604, "r_x3": 388.7023, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 520.11859, "r_x1": 545.11511, "r_y1": 520.11859, "r_x2": 545.11511, "r_y2": 511.21204, "r_x3": 308.86203, "r_y3": 511.21204, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 532.07358, "r_x1": 545.11505, "r_y1": 532.07358, "r_x2": 545.11505, "r_y2": 523.16702, "r_x3": 308.86203, "r_y3": 523.16702, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 544.02858, "r_x1": 545.11499, "r_y1": 544.02858, "r_x2": 545.11499, "r_y2": 535.12201, "r_x3": 308.86203, "r_y3": 535.12201, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 555.98358, "r_x1": 545.11517, "r_y1": 555.98358, "r_x2": 545.11517, "r_y2": 547.07703, "r_x3": 308.86203, "r_y3": 547.07703, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 567.93858, "r_x1": 442.22147000000007, "r_y1": 567.93858, "r_x2": 442.22147000000007, "r_y2": 559.03203, "r_x3": 308.86203, "r_y3": 559.03203, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan." }, { "label": "text", "id": 19, "page_no": 11, "cluster": { "id": 19, "label": "text", "bbox": { "l": 308.86203, "t": 571.33803, "r": 545.11688, "b": 604.15459, "coord_origin": "TOPLEFT" }, "confidence": 0.8459473848342896, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 580.24458, "r_x1": 545.11493, "r_y1": 580.24458, "r_x2": 545.11493, "r_y2": 571.33803, "r_x3": 320.81702, "r_y3": 571.33803, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 592.19958, "r_x1": 471.64093, "r_y1": 592.19958, "r_x2": 471.64093, "r_y2": 583.29303, "r_x3": 308.86203, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83405, "r_y0": 591.98041, "r_x1": 479.71872, "r_y1": 591.98041, "r_x2": 479.71872, "r_y2": 583.1336200000001, "r_x3": 474.83405, "r_y3": 583.1336200000001, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.26903999999996, "r_y0": 592.19958, "r_x1": 545.11688, "r_y1": 592.19958, "r_x2": 545.11688, "r_y2": 583.29303, "r_x3": 483.26903999999996, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 604.15459, "r_x1": 329.91306, "r_y1": 604.15459, "r_x2": 329.91306, "r_y2": 595.24803, "r_x3": 308.86206, "r_y3": 595.24803, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)." }, { "label": "list_item", "id": 21, "page_no": 11, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.86206, "t": 607.55304, "r": 545.11505, "b": 628.4155900000001, "coord_origin": "TOPLEFT" }, "confidence": 0.7716891169548035, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 616.4595899999999, "r_x1": 332.8718, "r_y1": 616.4595899999999, "r_x2": 332.8718, "r_y2": 607.55304, "r_x3": 320.81705, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.92532, "r_y0": 616.4595899999999, "r_x1": 545.11505, "r_y1": 616.4595899999999, "r_x2": 545.11505, "r_y2": 607.55304, "r_x3": 339.92532, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 628.4155900000001, "r_x1": 495.2923, "r_y1": 628.4155900000001, "r_x2": 495.2923, "r_y2": 619.50903, "r_x3": 308.86206, "r_y3": 619.50903, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row." }, { "label": "list_item", "id": 18, "page_no": 11, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.86206, "t": 631.81403, "r": 545.11505, "b": 664.63059, "coord_origin": "TOPLEFT" }, "confidence": 0.8584907054901123, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 640.72058, "r_x1": 545.11505, "r_y1": 640.72058, "r_x2": 545.11505, "r_y2": 631.81403, "r_x3": 320.81705, "r_y3": 631.81403, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 652.67558, "r_x1": 455.28238, "r_y1": 652.67558, "r_x2": 455.28238, "r_y2": 643.7690299999999, "r_x3": 308.86206, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.77704, "r_y0": 652.45641, "r_x1": 463.47067, "r_y1": 652.45641, "r_x2": 463.47067, "r_y2": 643.60962, "r_x3": 457.77704, "r_y3": 643.60962, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97104, "r_y0": 652.67558, "r_x1": 545.11389, "r_y1": 652.67558, "r_x2": 545.11389, "r_y2": 643.7690299999999, "r_x3": 465.97104, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 664.63059, "r_x1": 332.38376, "r_y1": 664.63059, "r_x2": 332.38376, "r_y2": 655.72403, "r_x3": 308.86206, "r_y3": 655.72403, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)." }, { "label": "list_item", "id": 22, "page_no": 11, "cluster": { "id": 22, "label": "list_item", "bbox": { "l": 308.86206, "t": 668.03003, "r": 545.11499, "b": 688.89159, "coord_origin": "TOPLEFT" }, "confidence": 0.7590745091438293, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 676.93659, "r_x1": 545.11499, "r_y1": 676.93659, "r_x2": 545.11499, "r_y2": 668.03003, "r_x3": 320.81705, "r_y3": 668.03003, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 688.89159, "r_x1": 510.5848700000001, "r_y1": 688.89159, "r_x2": 510.5848700000001, "r_y2": 679.98503, "r_x3": 308.86206, "r_y3": 679.98503, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column." }, { "label": "list_item", "id": 25, "page_no": 11, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 308.86206, "t": 692.290024, "r": 545.11517, "b": 713.151596, "coord_origin": "TOPLEFT" }, "confidence": 0.6971189975738525, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 701.196594, "r_x1": 545.11505, "r_y1": 701.196594, "r_x2": 545.11505, "r_y2": 692.290024, "r_x3": 320.81705, "r_y3": 692.290024, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 713.151596, "r_x1": 545.11517, "r_y1": 713.151596, "r_x2": 545.11517, "r_y2": 704.245026, "r_x3": 308.86206, "r_y3": 704.245026, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-" }, { "label": "page_footer", "id": 14, "page_no": 11, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 292.63107, "t": 734.13303, "r": 302.59366, "b": 743.039593, "coord_origin": "TOPLEFT" }, "confidence": 0.9126598238945007, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63107, "r_y0": 743.039593, "r_x1": 302.59366, "r_y1": 743.039593, "r_x2": 302.59366, "r_y2": 734.13303, "r_x3": 292.63107, "r_y3": 734.13303, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" } ], "body": [ { "label": "picture", "id": 30, "page_no": 11, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT" }, "confidence": 0.6033818125724792, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39108, "r_y0": 83.25922000000003, "r_x1": 151.94641, "r_y1": 83.25922000000003, "r_x2": 151.94641, "r_y2": 77.31055000000003, "r_x3": 119.39108, "r_y3": 77.31055000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.345978, "r_y0": 81.14020000000005, "r_x1": 59.327053, "r_y1": 81.14020000000005, "r_x2": 59.327053, "r_y2": 75.19152999999994, "r_x3": 53.345978, "r_y3": 75.19152999999994, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.5791, "r_y0": 83.40698000000009, "r_x1": 319.8266, "r_y1": 83.40698000000009, "r_x2": 319.8266, "r_y2": 77.45830999999998, "r_x3": 289.5791, "r_y3": 77.45830999999998, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37271, "r_y0": 83.20263999999997, "r_x1": 481.75916, "r_y1": 83.20263999999997, "r_x2": 481.75916, "r_y2": 77.25396999999987, "r_x3": 448.37271, "r_y3": 77.25396999999987, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.553436, "r_y0": 146.23339999999996, "r_x1": 94.976013, "r_y1": 146.23339999999996, "r_x2": 94.976013, "r_y2": 141.27617999999995, "r_x3": 82.553436, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.03878399999999, "r_y0": 106.06133999999986, "r_x1": 85.290085, "r_y1": 106.06133999999986, "r_x2": 85.290085, "r_y2": 101.10413000000005, "r_x3": 63.03878399999999, "r_y3": 101.10413000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.76786, "r_y0": 129.35253999999998, "r_x1": 85.231277, "r_y1": 129.35253999999998, "r_x2": 85.231277, "r_y2": 124.39531999999997, "r_x3": 67.76786, "r_y3": 124.39531999999997, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55121, "r_y0": 107.49712999999997, "r_x1": 249.80251, "r_y1": 107.49712999999997, "r_x2": 249.80251, "r_y2": 102.53992000000005, "r_x3": 227.55121, "r_y3": 102.53992000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.19898999999998, "r_y0": 131.94299, "r_x1": 249.66241, "r_y1": 131.94299, "r_x2": 249.66241, "r_y2": 126.98577999999986, "r_x3": 232.19898999999998, "r_y3": 126.98577999999986, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2337, "r_y0": 119.00243999999998, "r_x1": 413.69711, "r_y1": 119.00243999999998, "r_x2": 413.69711, "r_y2": 114.04522999999995, "r_x3": 396.2337, "r_y3": 114.04522999999995, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.382202, "r_y0": 146.23339999999996, "r_x1": 105.08014, "r_y1": 146.23339999999996, "r_x2": 105.08014, "r_y2": 141.27617999999995, "r_x3": 97.382202, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.93763400000001, "r_y0": 90.69042999999999, "r_x1": 76.151443, "r_y1": 90.69042999999999, "r_x2": 76.151443, "r_y2": 85.73321999999996, "r_x3": 60.93763400000001, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.304901, "r_y0": 91.18073000000015, "r_x1": 106.99162, "r_y1": 91.18073000000015, "r_x2": 106.99162, "r_y2": 86.22351000000003, "r_x3": 82.304901, "r_y3": 86.22351000000003, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.20530999999997, "r_y0": 146.56329000000005, "r_x1": 281.88013, "r_y1": 146.56329000000005, "r_x2": 281.88013, "r_y2": 141.60608000000002, "r_x3": 246.20530999999997, "r_y3": 141.60608000000002, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.69780000000003, "r_y0": 90.69042999999999, "r_x1": 241.91161, "r_y1": 90.69042999999999, "r_x2": 241.91161, "r_y2": 85.73321999999996, "r_x3": 226.69780000000003, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.93848999999997, "r_y0": 91.04522999999995, "r_x1": 282.49384, "r_y1": 91.04522999999995, "r_x2": 282.49384, "r_y2": 86.08801000000005, "r_x3": 249.93848999999997, "r_y3": 86.08801000000005, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19409, "r_y0": 146.23339999999996, "r_x1": 444.68915, "r_y1": 146.23339999999996, "r_x2": 444.68915, "r_y2": 141.27617999999995, "r_x3": 410.19409, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37341, "r_y0": 90.69042999999999, "r_x1": 432.6716599999999, "r_y1": 90.69042999999999, "r_x2": 432.6716599999999, "r_y2": 85.73321999999996, "r_x3": 391.37341, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.60571000000004, "r_y0": 91.21862999999996, "r_x1": 445.62414999999993, "r_y1": 91.21862999999996, "r_x2": 445.62414999999993, "r_y2": 86.26140999999996, "r_x3": 435.60571000000004, "r_y3": 86.26140999999996, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.94921, "r_y0": 146.24567000000002, "r_x1": 136.20052, "r_y1": 146.24567000000002, "r_x2": 136.20052, "r_y2": 141.28845, "r_x3": 113.94921, "r_y3": 141.28845, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.91554000000001, "r_y0": 99.77575999999999, "r_x1": 127.05433999999998, "r_y1": 99.77575999999999, "r_x2": 127.05433999999998, "r_y2": 94.81853999999998, "r_x3": 116.91554000000001, "r_y3": 94.81853999999998, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.3146, "r_y0": 105.89575000000002, "r_x1": 127.05298, "r_y1": 105.89575000000002, "r_x2": 127.05298, "r_y2": 100.93853999999999, "r_x3": 113.3146, "r_y3": 100.93853999999999, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94112, "r_y0": 112.01575000000003, "r_x1": 127.05537, "r_y1": 112.01575000000003, "r_x2": 127.05537, "r_y2": 107.05853000000013, "r_x3": 112.94112, "r_y3": 107.05853000000013, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.22738999999999, "r_y0": 127.57245, "r_x1": 126.96577, "r_y1": 127.57245, "r_x2": 126.96577, "r_y2": 122.61523, "r_x3": 113.22738999999999, "r_y3": 122.61523, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85390000000001, "r_y0": 133.69244000000003, "r_x1": 126.96814999999998, "r_y1": 133.69244000000003, "r_x2": 126.96814999999998, "r_y2": 128.73523, "r_x3": 112.85390000000001, "r_y3": 128.73523, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.57864, "r_y0": 146.39362000000006, "r_x1": 156.04207, "r_y1": 146.39362000000006, "r_x2": 156.04207, "r_y2": 141.43640000000005, "r_x3": 138.57864, "r_y3": 141.43640000000005, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03101, "r_y0": 91.22852, "r_x1": 151.04185, "r_y1": 91.22852, "r_x2": 151.04185, "r_y2": 86.2713, "r_x3": 122.03101, "r_y3": 86.2713, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65359, "r_y0": 91.5122100000001, "r_x1": 321.67203, "r_y1": 91.5122100000001, "r_x2": 321.67203, "r_y2": 86.55498999999998, "r_x3": 311.65359, "r_y3": 86.55498999999998, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89441, "r_y0": 146.66785000000004, "r_x1": 310.14572, "r_y1": 146.66785000000004, "r_x2": 310.14572, "r_y2": 141.71063000000004, "r_x3": 287.89441, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.23572, "r_y0": 98.03698999999995, "r_x1": 299.37451, "r_y1": 98.03698999999995, "r_x2": 299.37451, "r_y2": 93.07977000000005, "r_x3": 289.23572, "r_y3": 93.07977000000005, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63513, "r_y0": 104.15698000000009, "r_x1": 299.3735, "r_y1": 104.15698000000009, "r_x2": 299.3735, "r_y2": 99.19976999999994, "r_x3": 285.63513, "r_y3": 99.19976999999994, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26111, "r_y0": 110.27697999999998, "r_x1": 299.37537, "r_y1": 110.27697999999998, "r_x2": 299.37537, "r_y2": 105.31975999999997, "r_x3": 285.26111, "r_y3": 105.31975999999997, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43109, "r_y0": 125.34717, "r_x1": 299.16946, "r_y1": 125.34717, "r_x2": 299.16946, "r_y2": 120.38995, "r_x3": 285.43109, "r_y3": 120.38995, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.05713, "r_y0": 131.46716000000004, "r_x1": 299.17139, "r_y1": 131.46716000000004, "r_x2": 299.17139, "r_y2": 126.50995, "r_x3": 285.05713, "r_y3": 126.50995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.34592, "r_y0": 146.66785000000004, "r_x1": 328.80933, "r_y1": 146.66785000000004, "r_x2": 328.80933, "r_y2": 141.71063000000004, "r_x3": 311.34592, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58362, "r_y0": 91.65075999999999, "r_x1": 309.60205, "r_y1": 91.65075999999999, "r_x2": 309.60205, "r_y2": 86.69353999999998, "r_x3": 299.58362, "r_y3": 86.69353999999998, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04077000000007, "r_y0": 146.62891000000002, "r_x1": 483.50418, "r_y1": 146.62891000000002, "r_x2": 483.50418, "r_y2": 141.67169, "r_x3": 466.04077000000007, "r_y3": 141.67169, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02151, "r_y0": 98.71838000000002, "r_x1": 469.16031000000004, "r_y1": 98.71838000000002, "r_x2": 469.16031000000004, "r_y2": 93.76116999999999, "r_x3": 459.02151, "r_y3": 93.76116999999999, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.4209, "r_y0": 104.83838000000003, "r_x1": 469.15927000000005, "r_y1": 104.83838000000003, "r_x2": 469.15927000000005, "r_y2": 99.88116000000002, "r_x3": 455.4209, "r_y3": 99.88116000000002, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.04691, "r_y0": 110.95836999999995, "r_x1": 469.16115999999994, "r_y1": 110.95836999999995, "r_x2": 469.16115999999994, "r_y2": 106.00116000000014, "r_x3": 455.04691, "r_y3": 106.00116000000014, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39401, "r_y0": 90.52959999999996, "r_x1": 480.6545100000001, "r_y1": 90.52959999999996, "r_x2": 480.6545100000001, "r_y2": 85.57239000000004, "r_x3": 467.39401, "r_y3": 85.57239000000004, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37672, "r_y0": 146.54107999999997, "r_x1": 182.62802, "r_y1": 146.54107999999997, "r_x2": 182.62802, "r_y2": 141.58385999999996, "r_x3": 160.37672, "r_y3": 141.58385999999996, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74265, "r_y0": 99.82201999999995, "r_x1": 173.32664, "r_y1": 99.82201999999995, "r_x2": 173.32664, "r_y2": 94.86481000000003, "r_x3": 153.74265, "r_y3": 94.86481000000003, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50967, "r_y0": 105.94202000000007, "r_x1": 173.3246, "r_y1": 105.94202000000007, "r_x2": 173.3246, "r_y2": 100.98479999999995, "r_x3": 154.50967, "r_y3": 100.98479999999995, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27162, "r_y0": 112.06200999999987, "r_x1": 173.32664, "r_y1": 112.06200999999987, "r_x2": 173.32664, "r_y2": 107.10479999999995, "r_x3": 155.27162, "r_y3": 107.10479999999995, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41302, "r_y0": 112.18970000000002, "r_x1": 345.99701, "r_y1": 112.18970000000002, "r_x2": 345.99701, "r_y2": 107.23248000000001, "r_x3": 326.41302, "r_y3": 107.23248000000001, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.17972, "r_y0": 118.30969000000005, "r_x1": 345.99463, "r_y1": 118.30969000000005, "r_x2": 345.99463, "r_y2": 113.35248000000001, "r_x3": 327.17972, "r_y3": 113.35248000000001, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94131, "r_y0": 124.42969000000005, "r_x1": 345.99634, "r_y1": 124.42969000000005, "r_x2": 345.99634, "r_y2": 119.47247000000004, "r_x3": 327.94131, "r_y3": 119.47247000000004, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.9942, "r_y0": 109.11095999999998, "r_x1": 508.76384999999993, "r_y1": 109.11095999999998, "r_x2": 508.76384999999993, "r_y2": 104.15374999999983, "r_x3": 488.9942, "r_y3": 104.15374999999983, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.1893, "r_y0": 115.2309600000001, "r_x1": 508.76349000000005, "r_y1": 115.2309600000001, "r_x2": 508.76349000000005, "r_y2": 110.27373999999998, "r_x3": 490.1893, "r_y3": 110.27373999999998, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72009, "r_y0": 121.35095000000013, "r_x1": 508.76758, "r_y1": 121.35095000000013, "r_x2": 508.76758, "r_y2": 116.39373999999998, "r_x3": 489.72009, "r_y3": 116.39373999999998, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71121, "r_y0": 127.47095000000002, "r_x1": 508.76624, "r_y1": 127.47095000000002, "r_x2": 508.76624, "r_y2": 122.51373000000001, "r_x3": 490.71121, "r_y3": 122.51373000000001, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.37759, "r_y0": 146.66840000000002, "r_x1": 202.84102, "r_y1": 146.66840000000002, "r_x2": 202.84102, "r_y2": 141.71118, "r_x3": 185.37759, "r_y3": 141.71118, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.50357, "r_y0": 91.09331999999995, "r_x1": 197.52699, "r_y1": 91.09331999999995, "r_x2": 197.52699, "r_y2": 86.13611000000003, "r_x3": 168.50357, "r_y3": 86.13611000000003, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.3768, "r_y0": 90.95428000000004, "r_x1": 367.39523, "r_y1": 90.95428000000004, "r_x2": 367.39523, "r_y2": 85.99707000000001, "r_x3": 357.3768, "r_y3": 85.99707000000001, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73151, "r_y0": 146.58043999999995, "r_x1": 374.92862, "r_y1": 146.58043999999995, "r_x2": 374.92862, "r_y2": 141.62323000000004, "r_x3": 333.73151, "r_y3": 141.62323000000004, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69101, "r_y0": 91.01312000000007, "r_x1": 355.70944, "r_y1": 91.01312000000007, "r_x2": 355.70944, "r_y2": 86.05591000000004, "r_x3": 345.69101, "r_y3": 86.05591000000004, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54248, "r_y0": 146.33405000000005, "r_x1": 526.00592, "r_y1": 146.33405000000005, "r_x2": 526.00592, "r_y2": 141.37683000000004, "r_x3": 508.54248, "r_y3": 141.37683000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.44653000000005, "r_y0": 91.0498, "r_x1": 523.70703, "r_y1": 91.0498, "r_x2": 523.70703, "r_y2": 86.09258999999986, "r_x3": 510.44653000000005, "r_y3": 86.09258999999986, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 46, "label": "text", "bbox": { "l": 119.39108, "t": 77.31055000000003, "r": 151.94641, "b": 83.25922000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39108, "r_y0": 83.25922000000003, "r_x1": 151.94641, "r_y1": 83.25922000000003, "r_x2": 151.94641, "r_y2": 77.31055000000003, "r_x3": 119.39108, "r_y3": 77.31055000000003, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 53.345978, "t": 75.19152999999994, "r": 59.327053, "b": 81.14020000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.345978, "r_y0": 81.14020000000005, "r_x1": 59.327053, "r_y1": 81.14020000000005, "r_x2": 59.327053, "r_y2": 75.19152999999994, "r_x3": 53.345978, "r_y3": 75.19152999999994, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 289.5791, "t": 77.45830999999998, "r": 319.8266, "b": 83.40698000000009, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.5791, "r_y0": 83.40698000000009, "r_x1": 319.8266, "r_y1": 83.40698000000009, "r_x2": 319.8266, "r_y2": 77.45830999999998, "r_x3": 289.5791, "r_y3": 77.45830999999998, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 448.37271, "t": 77.25396999999987, "r": 481.75916, "b": 83.20263999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37271, "r_y0": 83.20263999999997, "r_x1": 481.75916, "r_y1": 83.20263999999997, "r_x2": 481.75916, "r_y2": 77.25396999999987, "r_x3": 448.37271, "r_y3": 77.25396999999987, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 82.553436, "t": 141.27617999999995, "r": 94.976013, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.553436, "r_y0": 146.23339999999996, "r_x1": 94.976013, "r_y1": 146.23339999999996, "r_x2": 94.976013, "r_y2": 141.27617999999995, "r_x3": 82.553436, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 63.03878399999999, "t": 101.10413000000005, "r": 85.290085, "b": 106.06133999999986, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.03878399999999, "r_y0": 106.06133999999986, "r_x1": 85.290085, "r_y1": 106.06133999999986, "r_x2": 85.290085, "r_y2": 101.10413000000005, "r_x3": 63.03878399999999, "r_y3": 101.10413000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 67.76786, "t": 124.39531999999997, "r": 85.231277, "b": 129.35253999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.76786, "r_y0": 129.35253999999998, "r_x1": 85.231277, "r_y1": 129.35253999999998, "r_x2": 85.231277, "r_y2": 124.39531999999997, "r_x3": 67.76786, "r_y3": 124.39531999999997, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 227.55121, "t": 102.53992000000005, "r": 249.80251, "b": 107.49712999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55121, "r_y0": 107.49712999999997, "r_x1": 249.80251, "r_y1": 107.49712999999997, "r_x2": 249.80251, "r_y2": 102.53992000000005, "r_x3": 227.55121, "r_y3": 102.53992000000005, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 232.19898999999998, "t": 126.98577999999986, "r": 249.66241, "b": 131.94299, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.19898999999998, "r_y0": 131.94299, "r_x1": 249.66241, "r_y1": 131.94299, "r_x2": 249.66241, "r_y2": 126.98577999999986, "r_x3": 232.19898999999998, "r_y3": 126.98577999999986, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 396.2337, "t": 114.04522999999995, "r": 413.69711, "b": 119.00243999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2337, "r_y0": 119.00243999999998, "r_x1": 413.69711, "r_y1": 119.00243999999998, "r_x2": 413.69711, "r_y2": 114.04522999999995, "r_x3": 396.2337, "r_y3": 114.04522999999995, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 97.382202, "t": 141.27617999999995, "r": 105.08014, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.382202, "r_y0": 146.23339999999996, "r_x1": 105.08014, "r_y1": 146.23339999999996, "r_x2": 105.08014, "r_y2": 141.27617999999995, "r_x3": 97.382202, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 60.93763400000001, "t": 85.73321999999996, "r": 76.151443, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.93763400000001, "r_y0": 90.69042999999999, "r_x1": 76.151443, "r_y1": 90.69042999999999, "r_x2": 76.151443, "r_y2": 85.73321999999996, "r_x3": 60.93763400000001, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 82.304901, "t": 86.22351000000003, "r": 106.99162, "b": 91.18073000000015, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.304901, "r_y0": 91.18073000000015, "r_x1": 106.99162, "r_y1": 91.18073000000015, "r_x2": 106.99162, "r_y2": 86.22351000000003, "r_x3": 82.304901, "r_y3": 86.22351000000003, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 246.20530999999997, "t": 141.60608000000002, "r": 281.88013, "b": 146.56329000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.20530999999997, "r_y0": 146.56329000000005, "r_x1": 281.88013, "r_y1": 146.56329000000005, "r_x2": 281.88013, "r_y2": 141.60608000000002, "r_x3": 246.20530999999997, "r_y3": 141.60608000000002, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 226.69780000000003, "t": 85.73321999999996, "r": 241.91161, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.69780000000003, "r_y0": 90.69042999999999, "r_x1": 241.91161, "r_y1": 90.69042999999999, "r_x2": 241.91161, "r_y2": 85.73321999999996, "r_x3": 226.69780000000003, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 249.93848999999997, "t": 86.08801000000005, "r": 282.49384, "b": 91.04522999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.93848999999997, "r_y0": 91.04522999999995, "r_x1": 282.49384, "r_y1": 91.04522999999995, "r_x2": 282.49384, "r_y2": 86.08801000000005, "r_x3": 249.93848999999997, "r_y3": 86.08801000000005, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 410.19409, "t": 141.27617999999995, "r": 444.68915, "b": 146.23339999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19409, "r_y0": 146.23339999999996, "r_x1": 444.68915, "r_y1": 146.23339999999996, "r_x2": 444.68915, "r_y2": 141.27617999999995, "r_x3": 410.19409, "r_y3": 141.27617999999995, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 391.37341, "t": 85.73321999999996, "r": 432.6716599999999, "b": 90.69042999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37341, "r_y0": 90.69042999999999, "r_x1": 432.6716599999999, "r_y1": 90.69042999999999, "r_x2": 432.6716599999999, "r_y2": 85.73321999999996, "r_x3": 391.37341, "r_y3": 85.73321999999996, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 435.60571000000004, "t": 86.26140999999996, "r": 445.62414999999993, "b": 91.21862999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.60571000000004, "r_y0": 91.21862999999996, "r_x1": 445.62414999999993, "r_y1": 91.21862999999996, "r_x2": 445.62414999999993, "r_y2": 86.26140999999996, "r_x3": 435.60571000000004, "r_y3": 86.26140999999996, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 113.94921, "t": 141.28845, "r": 136.20052, "b": 146.24567000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.94921, "r_y0": 146.24567000000002, "r_x1": 136.20052, "r_y1": 146.24567000000002, "r_x2": 136.20052, "r_y2": 141.28845, "r_x3": 113.94921, "r_y3": 141.28845, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 116.91554000000001, "t": 94.81853999999998, "r": 127.05433999999998, "b": 99.77575999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.91554000000001, "r_y0": 99.77575999999999, "r_x1": 127.05433999999998, "r_y1": 99.77575999999999, "r_x2": 127.05433999999998, "r_y2": 94.81853999999998, "r_x3": 116.91554000000001, "r_y3": 94.81853999999998, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 113.3146, "t": 100.93853999999999, "r": 127.05298, "b": 105.89575000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.3146, "r_y0": 105.89575000000002, "r_x1": 127.05298, "r_y1": 105.89575000000002, "r_x2": 127.05298, "r_y2": 100.93853999999999, "r_x3": 113.3146, "r_y3": 100.93853999999999, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 112.94112, "t": 107.05853000000013, "r": 127.05537, "b": 112.01575000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94112, "r_y0": 112.01575000000003, "r_x1": 127.05537, "r_y1": 112.01575000000003, "r_x2": 127.05537, "r_y2": 107.05853000000013, "r_x3": 112.94112, "r_y3": 107.05853000000013, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 113.22738999999999, "t": 122.61523, "r": 126.96577, "b": 127.57245, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.22738999999999, "r_y0": 127.57245, "r_x1": 126.96577, "r_y1": 127.57245, "r_x2": 126.96577, "r_y2": 122.61523, "r_x3": 113.22738999999999, "r_y3": 122.61523, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 112.85390000000001, "t": 128.73523, "r": 126.96814999999998, "b": 133.69244000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85390000000001, "r_y0": 133.69244000000003, "r_x1": 126.96814999999998, "r_y1": 133.69244000000003, "r_x2": 126.96814999999998, "r_y2": 128.73523, "r_x3": 112.85390000000001, "r_y3": 128.73523, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 138.57864, "t": 141.43640000000005, "r": 156.04207, "b": 146.39362000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.57864, "r_y0": 146.39362000000006, "r_x1": 156.04207, "r_y1": 146.39362000000006, "r_x2": 156.04207, "r_y2": 141.43640000000005, "r_x3": 138.57864, "r_y3": 141.43640000000005, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 122.03101, "t": 86.2713, "r": 151.04185, "b": 91.22852, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03101, "r_y0": 91.22852, "r_x1": 151.04185, "r_y1": 91.22852, "r_x2": 151.04185, "r_y2": 86.2713, "r_x3": 122.03101, "r_y3": 86.2713, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 311.65359, "t": 86.55498999999998, "r": 321.67203, "b": 91.5122100000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65359, "r_y0": 91.5122100000001, "r_x1": 321.67203, "r_y1": 91.5122100000001, "r_x2": 321.67203, "r_y2": 86.55498999999998, "r_x3": 311.65359, "r_y3": 86.55498999999998, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 287.89441, "t": 141.71063000000004, "r": 310.14572, "b": 146.66785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89441, "r_y0": 146.66785000000004, "r_x1": 310.14572, "r_y1": 146.66785000000004, "r_x2": 310.14572, "r_y2": 141.71063000000004, "r_x3": 287.89441, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.23572, "t": 93.07977000000005, "r": 299.37451, "b": 98.03698999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.23572, "r_y0": 98.03698999999995, "r_x1": 299.37451, "r_y1": 98.03698999999995, "r_x2": 299.37451, "r_y2": 93.07977000000005, "r_x3": 289.23572, "r_y3": 93.07977000000005, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 285.63513, "t": 99.19976999999994, "r": 299.3735, "b": 104.15698000000009, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63513, "r_y0": 104.15698000000009, "r_x1": 299.3735, "r_y1": 104.15698000000009, "r_x2": 299.3735, "r_y2": 99.19976999999994, "r_x3": 285.63513, "r_y3": 99.19976999999994, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 285.26111, "t": 105.31975999999997, "r": 299.37537, "b": 110.27697999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26111, "r_y0": 110.27697999999998, "r_x1": 299.37537, "r_y1": 110.27697999999998, "r_x2": 299.37537, "r_y2": 105.31975999999997, "r_x3": 285.26111, "r_y3": 105.31975999999997, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 285.43109, "t": 120.38995, "r": 299.16946, "b": 125.34717, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43109, "r_y0": 125.34717, "r_x1": 299.16946, "r_y1": 125.34717, "r_x2": 299.16946, "r_y2": 120.38995, "r_x3": 285.43109, "r_y3": 120.38995, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 285.05713, "t": 126.50995, "r": 299.17139, "b": 131.46716000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.05713, "r_y0": 131.46716000000004, "r_x1": 299.17139, "r_y1": 131.46716000000004, "r_x2": 299.17139, "r_y2": 126.50995, "r_x3": 285.05713, "r_y3": 126.50995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 311.34592, "t": 141.71063000000004, "r": 328.80933, "b": 146.66785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.34592, "r_y0": 146.66785000000004, "r_x1": 328.80933, "r_y1": 146.66785000000004, "r_x2": 328.80933, "r_y2": 141.71063000000004, "r_x3": 311.34592, "r_y3": 141.71063000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 299.58362, "t": 86.69353999999998, "r": 309.60205, "b": 91.65075999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58362, "r_y0": 91.65075999999999, "r_x1": 309.60205, "r_y1": 91.65075999999999, "r_x2": 309.60205, "r_y2": 86.69353999999998, "r_x3": 299.58362, "r_y3": 86.69353999999998, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 466.04077000000007, "t": 141.67169, "r": 483.50418, "b": 146.62891000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04077000000007, "r_y0": 146.62891000000002, "r_x1": 483.50418, "r_y1": 146.62891000000002, "r_x2": 483.50418, "r_y2": 141.67169, "r_x3": 466.04077000000007, "r_y3": 141.67169, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 459.02151, "t": 93.76116999999999, "r": 469.16031000000004, "b": 98.71838000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02151, "r_y0": 98.71838000000002, "r_x1": 469.16031000000004, "r_y1": 98.71838000000002, "r_x2": 469.16031000000004, "r_y2": 93.76116999999999, "r_x3": 459.02151, "r_y3": 93.76116999999999, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 455.4209, "t": 99.88116000000002, "r": 469.15927000000005, "b": 104.83838000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.4209, "r_y0": 104.83838000000003, "r_x1": 469.15927000000005, "r_y1": 104.83838000000003, "r_x2": 469.15927000000005, "r_y2": 99.88116000000002, "r_x3": 455.4209, "r_y3": 99.88116000000002, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 455.04691, "t": 106.00116000000014, "r": 469.16115999999994, "b": 110.95836999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.04691, "r_y0": 110.95836999999995, "r_x1": 469.16115999999994, "r_y1": 110.95836999999995, "r_x2": 469.16115999999994, "r_y2": 106.00116000000014, "r_x3": 455.04691, "r_y3": 106.00116000000014, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 467.39401, "t": 85.57239000000004, "r": 480.6545100000001, "b": 90.52959999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39401, "r_y0": 90.52959999999996, "r_x1": 480.6545100000001, "r_y1": 90.52959999999996, "r_x2": 480.6545100000001, "r_y2": 85.57239000000004, "r_x3": 467.39401, "r_y3": 85.57239000000004, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 160.37672, "t": 141.58385999999996, "r": 182.62802, "b": 146.54107999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37672, "r_y0": 146.54107999999997, "r_x1": 182.62802, "r_y1": 146.54107999999997, "r_x2": 182.62802, "r_y2": 141.58385999999996, "r_x3": 160.37672, "r_y3": 141.58385999999996, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 153.74265, "t": 94.86481000000003, "r": 173.32664, "b": 99.82201999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74265, "r_y0": 99.82201999999995, "r_x1": 173.32664, "r_y1": 99.82201999999995, "r_x2": 173.32664, "r_y2": 94.86481000000003, "r_x3": 153.74265, "r_y3": 94.86481000000003, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 154.50967, "t": 100.98479999999995, "r": 173.3246, "b": 105.94202000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50967, "r_y0": 105.94202000000007, "r_x1": 173.3246, "r_y1": 105.94202000000007, "r_x2": 173.3246, "r_y2": 100.98479999999995, "r_x3": 154.50967, "r_y3": 100.98479999999995, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 155.27162, "t": 107.10479999999995, "r": 173.32664, "b": 112.06200999999987, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27162, "r_y0": 112.06200999999987, "r_x1": 173.32664, "r_y1": 112.06200999999987, "r_x2": 173.32664, "r_y2": 107.10479999999995, "r_x3": 155.27162, "r_y3": 107.10479999999995, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.41302, "t": 107.23248000000001, "r": 345.99701, "b": 112.18970000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41302, "r_y0": 112.18970000000002, "r_x1": 345.99701, "r_y1": 112.18970000000002, "r_x2": 345.99701, "r_y2": 107.23248000000001, "r_x3": 326.41302, "r_y3": 107.23248000000001, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 327.17972, "t": 113.35248000000001, "r": 345.99463, "b": 118.30969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.17972, "r_y0": 118.30969000000005, "r_x1": 345.99463, "r_y1": 118.30969000000005, "r_x2": 345.99463, "r_y2": 113.35248000000001, "r_x3": 327.17972, "r_y3": 113.35248000000001, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 327.94131, "t": 119.47247000000004, "r": 345.99634, "b": 124.42969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94131, "r_y0": 124.42969000000005, "r_x1": 345.99634, "r_y1": 124.42969000000005, "r_x2": 345.99634, "r_y2": 119.47247000000004, "r_x3": 327.94131, "r_y3": 119.47247000000004, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 488.9942, "t": 104.15374999999983, "r": 508.76384999999993, "b": 109.11095999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.9942, "r_y0": 109.11095999999998, "r_x1": 508.76384999999993, "r_y1": 109.11095999999998, "r_x2": 508.76384999999993, "r_y2": 104.15374999999983, "r_x3": 488.9942, "r_y3": 104.15374999999983, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 490.1893, "t": 110.27373999999998, "r": 508.76349000000005, "b": 115.2309600000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.1893, "r_y0": 115.2309600000001, "r_x1": 508.76349000000005, "r_y1": 115.2309600000001, "r_x2": 508.76349000000005, "r_y2": 110.27373999999998, "r_x3": 490.1893, "r_y3": 110.27373999999998, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 489.72009, "t": 116.39373999999998, "r": 508.76758, "b": 121.35095000000013, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72009, "r_y0": 121.35095000000013, "r_x1": 508.76758, "r_y1": 121.35095000000013, "r_x2": 508.76758, "r_y2": 116.39373999999998, "r_x3": 489.72009, "r_y3": 116.39373999999998, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 490.71121, "t": 122.51373000000001, "r": 508.76624, "b": 127.47095000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71121, "r_y0": 127.47095000000002, "r_x1": 508.76624, "r_y1": 127.47095000000002, "r_x2": 508.76624, "r_y2": 122.51373000000001, "r_x3": 490.71121, "r_y3": 122.51373000000001, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 185.37759, "t": 141.71118, "r": 202.84102, "b": 146.66840000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.37759, "r_y0": 146.66840000000002, "r_x1": 202.84102, "r_y1": 146.66840000000002, "r_x2": 202.84102, "r_y2": 141.71118, "r_x3": 185.37759, "r_y3": 141.71118, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 168.50357, "t": 86.13611000000003, "r": 197.52699, "b": 91.09331999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.50357, "r_y0": 91.09331999999995, "r_x1": 197.52699, "r_y1": 91.09331999999995, "r_x2": 197.52699, "r_y2": 86.13611000000003, "r_x3": 168.50357, "r_y3": 86.13611000000003, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 357.3768, "t": 85.99707000000001, "r": 367.39523, "b": 90.95428000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.3768, "r_y0": 90.95428000000004, "r_x1": 367.39523, "r_y1": 90.95428000000004, "r_x2": 367.39523, "r_y2": 85.99707000000001, "r_x3": 357.3768, "r_y3": 85.99707000000001, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 333.73151, "t": 141.62323000000004, "r": 374.92862, "b": 146.58043999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73151, "r_y0": 146.58043999999995, "r_x1": 374.92862, "r_y1": 146.58043999999995, "r_x2": 374.92862, "r_y2": 141.62323000000004, "r_x3": 333.73151, "r_y3": 141.62323000000004, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 345.69101, "t": 86.05591000000004, "r": 355.70944, "b": 91.01312000000007, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69101, "r_y0": 91.01312000000007, "r_x1": 355.70944, "r_y1": 91.01312000000007, "r_x2": 355.70944, "r_y2": 86.05591000000004, "r_x3": 345.69101, "r_y3": 86.05591000000004, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 508.54248, "t": 141.37683000000004, "r": 526.00592, "b": 146.33405000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54248, "r_y0": 146.33405000000005, "r_x1": 526.00592, "r_y1": 146.33405000000005, "r_x2": 526.00592, "r_y2": 141.37683000000004, "r_x3": 508.54248, "r_y3": 141.37683000000004, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 510.44653000000005, "t": 86.09258999999986, "r": 523.70703, "b": 91.0498, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.44653000000005, "r_y0": 91.0498, "r_x1": 523.70703, "r_y1": 91.0498, "r_x2": 523.70703, "r_y2": 86.09258999999986, "r_x3": 510.44653000000005, "r_y3": 86.09258999999986, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 50.112, "t": 165.50238000000002, "r": 545.11371, "b": 186.36395000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9661495685577393, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 174.40894000000003, "r_x1": 545.11371, "r_y1": 174.40894000000003, "r_x2": 545.11371, "r_y2": 165.50238000000002, "r_x3": 50.112, "r_y3": 165.50238000000002, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 186.36395000000005, "r_x1": 513.52234, "r_y1": 186.36395000000005, "r_x2": 513.52234, "r_y2": 177.4574, "r_x3": 50.112, "r_y3": 177.4574, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity." }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 61.569, "t": 210.93140000000005, "r": 286.36511, "b": 231.79296999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9621952772140503, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 219.83794999999998, "r_x1": 71.14743, "r_y1": 219.83794999999998, "r_x2": 71.14743, "r_y2": 210.93140000000005, "r_x3": 61.569, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.542038, "r_y0": 219.83794999999998, "r_x1": 286.36511, "r_y1": 219.83794999999998, "r_x2": 286.36511, "r_y2": 210.93140000000005, "r_x3": 73.542038, "r_y3": 210.93140000000005, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 231.79296999999997, "r_x1": 87.47155, "r_y1": 231.79296999999997, "r_x2": 87.47155, "r_y2": 222.88640999999996, "r_x3": 70.037003, "r_y3": 222.88640999999996, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 TableFormer output does not include the table cell content." }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 61.569, "t": 244.07141000000001, "r": 286.36514, "b": 264.93298000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9629555344581604, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.569, "r_y0": 252.97797000000003, "r_x1": 71.345718, "r_y1": 252.97797000000003, "r_x2": 71.345718, "r_y2": 244.07141000000001, "r_x3": 61.569, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.789902, "r_y0": 252.97797000000003, "r_x1": 286.36514, "r_y1": 252.97797000000003, "r_x2": 286.36514, "r_y2": 244.07141000000001, "r_x3": 73.789902, "r_y3": 244.07141000000001, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.037003, "r_y0": 264.93298000000004, "r_x1": 150.41524, "r_y1": 264.93298000000004, "r_x2": 150.41524, "r_y2": 256.02643, "r_x3": 70.037003, "r_y3": 256.02643, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.112, "t": 279.20343, "r": 286.36511, "b": 395.70688, "coord_origin": "TOPLEFT" }, "confidence": 0.9767085909843445, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 288.10999, "r_x1": 286.36499, "r_y1": 288.10999, "r_x2": 286.36499, "r_y2": 279.20343, "r_x3": 62.067001, "r_y3": 279.20343, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 300.06497, "r_x1": 286.36505, "r_y1": 300.06497, "r_x2": 286.36505, "r_y2": 291.15842, "r_x3": 50.112, "r_y3": 291.15842, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 312.01996, "r_x1": 286.36511, "r_y1": 312.01996, "r_x2": 286.36511, "r_y2": 303.1134, "r_x3": 50.112, "r_y3": 303.1134, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 323.97495, "r_x1": 286.36511, "r_y1": 323.97495, "r_x2": 286.36511, "r_y2": 315.06839, "r_x3": 50.112, "r_y3": 315.06839, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 335.93093999999996, "r_x1": 286.36511, "r_y1": 335.93093999999996, "r_x2": 286.36511, "r_y2": 327.02438, "r_x3": 50.112, "r_y3": 327.02438, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 347.88593, "r_x1": 286.36505, "r_y1": 347.88593, "r_x2": 286.36505, "r_y2": 338.97937, "r_x3": 50.112, "r_y3": 338.97937, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 359.84091, "r_x1": 286.36508, "r_y1": 359.84091, "r_x2": 286.36508, "r_y2": 350.93436, "r_x3": 50.112, "r_y3": 350.93436, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 371.7959, "r_x1": 286.36511, "r_y1": 371.7959, "r_x2": 286.36511, "r_y2": 362.88934, "r_x3": 50.112, "r_y3": 362.88934, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 383.75089, "r_x1": 286.36508, "r_y1": 383.75089, "r_x2": 286.36508, "r_y2": 374.84433000000007, "r_x3": 50.112, "r_y3": 374.84433000000007, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 395.70688, "r_x1": 154.55988, "r_y1": 395.70688, "r_x2": 154.55988, "r_y2": 386.80032, "r_x3": 50.112, "r_y3": 386.80032, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes." }, { "label": "text", "id": 11, "page_no": 11, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.112, "t": 399.06934, "r": 286.36496, "b": 419.93188, "coord_origin": "TOPLEFT" }, "confidence": 0.934766411781311, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 407.97589, "r_x1": 286.36496, "r_y1": 407.97589, "r_x2": 286.36496, "r_y2": 399.06934, "r_x3": 62.067001, "r_y3": 399.06934, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 419.93188, "r_x1": 95.491638, "r_y1": 419.93188, "r_x2": 95.491638, "r_y2": 411.02533, "r_x3": 50.112, "r_y3": 411.02533, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Here is a step-by-step description of the prediction postprocessing:" }, { "label": "list_item", "id": 20, "page_no": 11, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 50.112, "t": 423.29532, "r": 286.36508, "b": 456.11185000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.8280702233314514, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 432.20187, "r_x1": 69.37281, "r_y1": 432.20187, "r_x2": 69.37281, "r_y2": 423.29532, "r_x3": 62.067001, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.808075, "r_y0": 432.20187, "r_x1": 286.36502, "r_y1": 432.20187, "r_x2": 286.36502, "r_y2": 423.29532, "r_x3": 71.808075, "r_y3": 423.29532, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 444.15686, "r_x1": 286.36508, "r_y1": 444.15686, "r_x2": 286.36508, "r_y2": 435.25031, "r_x3": 50.112, "r_y3": 435.25031, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 456.11185000000006, "r_x1": 274.50958, "r_y1": 456.11185000000006, "r_x2": 274.50958, "r_y2": 447.20529, "r_x3": 50.112, "r_y3": 447.20529, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure." }, { "label": "list_item", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.112, "t": 459.47528, "r": 286.36505, "b": 504.2468, "coord_origin": "TOPLEFT" }, "confidence": 0.9646760821342468, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 468.38184, "r_x1": 69.538948, "r_y1": 468.38184, "r_x2": 69.538948, "r_y2": 459.47528, "r_x3": 62.067001, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.429329, "r_y0": 468.38184, "r_x1": 286.36499, "r_y1": 468.38184, "r_x2": 286.36499, "r_y2": 459.47528, "r_x3": 77.429329, "r_y3": 459.47528, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 480.33682, "r_x1": 286.36505, "r_y1": 480.33682, "r_x2": 286.36505, "r_y2": 471.43027, "r_x3": 50.112, "r_y3": 471.43027, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 492.29181, "r_x1": 286.36505, "r_y1": 492.29181, "r_x2": 286.36505, "r_y2": 483.38525, "r_x3": 50.112, "r_y3": 483.38525, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 504.2468, "r_x1": 110.70452999999999, "r_y1": 504.2468, "r_x2": 110.70452999999999, "r_y2": 495.34024, "r_x3": 50.112, "r_y3": 495.34024, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches." }, { "label": "list_item", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.112, "t": 507.61023, "r": 286.36493, "b": 528.4727800000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9391399025917053, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 516.5167799999999, "r_x1": 69.863068, "r_y1": 516.5167799999999, "r_x2": 69.863068, "r_y2": 507.61023, "r_x3": 62.067001, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.461754, "r_y0": 516.5167799999999, "r_x1": 286.36493, "r_y1": 516.5167799999999, "r_x2": 286.36493, "r_y2": 507.61023, "r_x3": 72.461754, "r_y3": 507.61023, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 528.4727800000001, "r_x1": 226.0714, "r_y1": 528.4727800000001, "r_x2": 226.0714, "r_y2": 519.5662199999999, "r_x3": 50.112, "r_y3": 519.5662199999999, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones." }, { "label": "list_item", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.112, "t": 531.83521, "r": 286.36511, "b": 564.65277, "coord_origin": "TOPLEFT" }, "confidence": 0.9491708874702454, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 540.7417800000001, "r_x1": 286.36496, "r_y1": 540.7417800000001, "r_x2": 286.36496, "r_y2": 531.83521, "r_x3": 62.067001, "r_y3": 531.83521, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 552.69777, "r_x1": 286.36511, "r_y1": 552.69777, "r_x2": 286.36511, "r_y2": 543.79121, "r_x3": 50.112, "r_y3": 543.79121, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 564.65277, "r_x1": 114.03204, "r_y1": 564.65277, "r_x2": 114.03204, "r_y2": 555.74622, "r_x3": 50.112, "r_y3": 555.74622, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column." }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.112, "t": 568.01622, "r": 286.36508, "b": 600.83278, "coord_origin": "TOPLEFT" }, "confidence": 0.9587163329124451, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 576.92278, "r_x1": 69.538948, "r_y1": 576.92278, "r_x2": 69.538948, "r_y2": 568.01622, "r_x3": 62.067001, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.731949, "r_y0": 576.92278, "r_x1": 286.36502, "r_y1": 576.92278, "r_x2": 286.36502, "r_y2": 568.01622, "r_x3": 76.731949, "r_y3": 568.01622, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 588.87778, "r_x1": 286.36508, "r_y1": 588.87778, "r_x2": 286.36508, "r_y2": 579.97122, "r_x3": 50.112, "r_y3": 579.97122, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 600.83278, "r_x1": 278.70383, "r_y1": 600.83278, "r_x2": 278.70383, "r_y2": 591.9262200000001, "r_x3": 50.112, "r_y3": 591.9262200000001, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:" }, { "label": "formula", "id": 12, "page_no": 11, "cluster": { "id": 12, "label": "formula", "bbox": { "l": 110.70499, "t": 623.43591, "r": 286.3624, "b": 654.1056100000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9298412799835205, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.02799999999999, "r_y0": 632.84061, "r_x1": 157.9516, "r_y1": 632.84061, "r_x2": 157.9516, "r_y2": 623.99382, "r_x3": 112.02799999999999, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.715, "r_y0": 632.84061, "r_x1": 203.4964, "r_y1": 632.84061, "r_x2": 203.4964, "r_y2": 623.99382, "r_x3": 160.715, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58499, "r_y0": 640.17578, "r_x1": 189.14511, "r_y1": 640.17578, "r_x2": 189.14511, "r_y2": 633.98305, "r_x3": 185.58499, "r_y3": 633.98305, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.49899, "r_y0": 632.84061, "r_x1": 208.48029, "r_y1": 632.84061, "r_x2": 208.48029, "r_y2": 623.43591, "r_x3": 203.49899, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48099, "r_y0": 632.84061, "r_x1": 220.28911, "r_y1": 632.84061, "r_x2": 220.28911, "r_y2": 623.99382, "r_x3": 208.48099, "r_y3": 623.99382, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.78699, "r_y0": 632.84061, "r_x1": 225.76828, "r_y1": 632.84061, "r_x2": 225.76828, "r_y2": 623.43591, "r_x3": 220.78699, "r_y3": 623.43591, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.70499, "r_y0": 654.1056100000001, "r_x1": 122.51310999999998, "r_y1": 654.1056100000001, "r_x2": 122.51310999999998, "r_y2": 645.25882, "r_x3": 110.70499, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.77899000000001, "r_y0": 654.1056100000001, "r_x1": 133.52791, "r_y1": 654.1056100000001, "r_x2": 133.52791, "r_y2": 645.25882, "r_x3": 125.77899000000001, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.295, "r_y0": 654.1056100000001, "r_x1": 156.00201, "r_y1": 654.1056100000001, "r_x2": 156.00201, "r_y2": 645.25882, "r_x3": 136.295, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.00299, "r_y0": 654.1056100000001, "r_x1": 160.98428, "r_y1": 654.1056100000001, "r_x2": 160.98428, "r_y2": 644.70091, "r_x3": 156.00299, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98399, "r_y0": 654.1056100000001, "r_x1": 170.23811, "r_y1": 654.1056100000001, "r_x2": 170.23811, "r_y2": 645.25882, "r_x3": 160.98399, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.73599, "r_y0": 654.1056100000001, "r_x1": 185.6779, "r_y1": 654.1056100000001, "r_x2": 185.6779, "r_y2": 644.70091, "r_x3": 170.73599, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.894, "r_y0": 654.1056100000001, "r_x1": 206.05283, "r_y1": 654.1056100000001, "r_x2": 206.05283, "r_y2": 645.25882, "r_x3": 187.894, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.054, "r_y0": 654.1056100000001, "r_x1": 211.03529, "r_y1": 654.1056100000001, "r_x2": 211.03529, "r_y2": 644.70091, "r_x3": 206.054, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.035, "r_y0": 654.1056100000001, "r_x1": 220.28912, "r_y1": 654.1056100000001, "r_x2": 220.28912, "r_y2": 645.25882, "r_x3": 211.035, "r_y3": 645.25882, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.787, "r_y0": 654.1056100000001, "r_x1": 225.76829999999998, "r_y1": 654.1056100000001, "r_x2": 225.76829999999998, "r_y2": 644.70091, "r_x3": 220.787, "r_y3": 644.70091, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.746, "r_y0": 643.79178, "r_x1": 286.3624, "r_y1": 643.79178, "r_x2": 286.3624, "r_y2": 634.88522, "r_x3": 274.746, "r_y3": 634.88522, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "alignment = arg min c { D$_{c}$ } D$_{c}$ = max { x$_{c}$ } \u2212 min { x$_{c}$ } (4)" }, { "label": "text", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.112, "t": 667.3479199999999, "r": 286.362, "b": 688.92679, "coord_origin": "TOPLEFT" }, "confidence": 0.9545555114746094, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 676.97179, "r_x1": 74.45063, "r_y1": 676.97179, "r_x2": 74.45063, "r_y2": 668.06522, "r_x3": 50.112, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.335999, "r_y0": 676.75261, "r_x1": 82.647812, "r_y1": 676.75261, "r_x2": 82.647812, "r_y2": 667.90582, "r_x3": 78.335999, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.532997, "r_y0": 676.97179, "r_x1": 123.63372, "r_y1": 676.97179, "r_x2": 123.63372, "r_y2": 668.06522, "r_x3": 86.532997, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.51899999999999, "r_y0": 676.75261, "r_x1": 132.50029, "r_y1": 676.75261, "r_x2": 132.50029, "r_y2": 667.3479199999999, "r_x3": 127.51899999999999, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.50099, "r_y0": 676.97179, "r_x1": 210.69743, "r_y1": 676.97179, "r_x2": 210.69743, "r_y2": 668.06522, "r_x3": 132.50099, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.69699, "r_y0": 676.75261, "r_x1": 215.67828, "r_y1": 676.75261, "r_x2": 215.67828, "r_y2": 667.3479199999999, "r_x3": 210.69699, "r_y3": 667.3479199999999, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56299, "r_y0": 676.97179, "r_x1": 233.94897000000003, "r_y1": 676.97179, "r_x2": 233.94897000000003, "r_y2": 668.06522, "r_x3": 219.56299, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83499000000003, "r_y0": 676.75261, "r_x1": 247.08911, "r_y1": 676.75261, "r_x2": 247.08911, "r_y2": 667.90582, "r_x3": 237.83499000000003, "r_y3": 667.90582, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47299000000004, "r_y0": 676.97179, "r_x1": 286.362, "r_y1": 676.97179, "r_x2": 286.362, "r_y2": 668.06522, "r_x3": 251.47299000000004, "r_y3": 668.06522, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 688.92679, "r_x1": 205.88721, "r_y1": 688.92679, "r_x2": 205.88721, "r_y2": 680.02022, "r_x3": 50.112, "r_y3": 680.02022, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where c is one of { left, centroid, right } and x$_{c}$ is the xcoordinate for the corresponding point." }, { "label": "list_item", "id": 13, "page_no": 11, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.112, "t": 692.290222, "r": 286.36496, "b": 713.151787, "coord_origin": "TOPLEFT" }, "confidence": 0.9260510206222534, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 701.196785, "r_x1": 69.538948, "r_y1": 701.196785, "r_x2": 69.538948, "r_y2": 692.290222, "r_x3": 62.067001, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.273666, "r_y0": 701.196785, "r_x1": 286.36496, "r_y1": 701.196785, "r_x2": 286.36496, "r_y2": 692.290222, "r_x3": 76.273666, "r_y3": 692.290222, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 713.151787, "r_x1": 94.604973, "r_y1": 713.151787, "r_x2": 94.604973, "r_y2": 704.245224, "r_x3": 50.112, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.598999, "r_y0": 712.93261, "r_x1": 103.29263, "r_y1": 712.93261, "r_x2": 103.29263, "r_y2": 704.085815, "r_x3": 97.598999, "r_y3": 704.085815, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.292, "r_y0": 713.151787, "r_x1": 286.36481, "r_y1": 713.151787, "r_x2": 286.36481, "r_y2": 704.245224, "r_x3": 103.292, "r_y3": 704.245224, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-" }, { "label": "text", "id": 16, "page_no": 11, "cluster": { "id": 16, "label": "text", "bbox": { "l": 308.862, "t": 210.93120999999996, "r": 545.11517, "b": 255.7038, "coord_origin": "TOPLEFT" }, "confidence": 0.8942298889160156, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 219.83776999999998, "r_x1": 545.11517, "r_y1": 219.83776999999998, "r_x2": 545.11517, "r_y2": 210.93120999999996, "r_x3": 308.862, "r_y3": 210.93120999999996, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 231.79376000000002, "r_x1": 545.11511, "r_y1": 231.79376000000002, "r_x2": 545.11511, "r_y2": 222.88720999999998, "r_x3": 308.862, "r_y3": 222.88720999999998, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 243.74878, "r_x1": 545.11511, "r_y1": 243.74878, "r_x2": 545.11511, "r_y2": 234.84222, "r_x3": 308.862, "r_y3": 234.84222, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 255.7038, "r_x1": 339.57669, "r_y1": 255.7038, "r_x2": 339.57669, "r_y2": 246.79724, "r_x3": 308.862, "r_y3": 246.79724, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal." }, { "label": "list_item", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.862, "t": 259.10222999999996, "r": 545.11499, "b": 279.96380999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9423392415046692, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81699, "r_y0": 268.00879, "r_x1": 328.28894, "r_y1": 268.00879, "r_x2": 328.28894, "r_y2": 259.10222999999996, "r_x3": 320.81699, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88419, "r_y0": 268.00879, "r_x1": 545.11499, "r_y1": 268.00879, "r_x2": 545.11499, "r_y2": 259.10222999999996, "r_x3": 334.88419, "r_y3": 259.10222999999996, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 279.96380999999997, "r_x1": 338.19189, "r_y1": 279.96380999999997, "r_x2": 338.19189, "r_y2": 271.05724999999995, "r_x3": 308.862, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68201, "r_y0": 279.74463000000003, "r_x1": 346.37564, "r_y1": 279.74463000000003, "r_x2": 346.37564, "r_y2": 270.89783, "r_x3": 340.68201, "r_y3": 270.89783, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37601, "r_y0": 279.96380999999997, "r_x1": 453.72305000000006, "r_y1": 279.96380999999997, "r_x2": 453.72305000000006, "r_y2": 271.05724999999995, "r_x3": 346.37601, "r_y3": 271.05724999999995, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes." }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86203, "t": 283.36325000000005, "r": 545.11511, "b": 387.91071, "coord_origin": "TOPLEFT" }, "confidence": 0.9562004804611206, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 292.26981, "r_x1": 328.38953, "r_y1": 292.26981, "r_x2": 328.38953, "r_y2": 283.36325000000005, "r_x3": 320.81702, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.9137, "r_y0": 292.26981, "r_x1": 545.11499, "r_y1": 292.26981, "r_x2": 545.11499, "r_y2": 283.36325000000005, "r_x3": 330.9137, "r_y3": 283.36325000000005, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 304.22479, "r_x1": 545.11511, "r_y1": 304.22479, "r_x2": 545.11511, "r_y2": 295.31824, "r_x3": 308.86203, "r_y3": 295.31824, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 316.17978, "r_x1": 545.11505, "r_y1": 316.17978, "r_x2": 545.11505, "r_y2": 307.27322, "r_x3": 308.86203, "r_y3": 307.27322, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 328.13477, "r_x1": 545.11511, "r_y1": 328.13477, "r_x2": 545.11511, "r_y2": 319.22821000000005, "r_x3": 308.86203, "r_y3": 319.22821000000005, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 340.09076000000005, "r_x1": 397.19043, "r_y1": 340.09076000000005, "r_x2": 397.19043, "r_y2": 331.1842, "r_x3": 308.86203, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.65616, "r_y0": 340.09076000000005, "r_x1": 545.11511, "r_y1": 340.09076000000005, "r_x2": 545.11511, "r_y2": 331.1842, "r_x3": 403.65616, "r_y3": 331.1842, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 352.04575, "r_x1": 545.11511, "r_y1": 352.04575, "r_x2": 545.11511, "r_y2": 343.13919, "r_x3": 308.86203, "r_y3": 343.13919, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 364.00073, "r_x1": 545.11505, "r_y1": 364.00073, "r_x2": 545.11505, "r_y2": 355.09418, "r_x3": 308.86203, "r_y3": 355.09418, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 375.95572000000004, "r_x1": 545.11505, "r_y1": 375.95572000000004, "r_x2": 545.11505, "r_y2": 367.04916, "r_x3": 308.86203, "r_y3": 367.04916, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 387.91071, "r_x1": 329.61414, "r_y1": 387.91071, "r_x2": 329.61414, "r_y2": 379.00415, "r_x3": 308.86203, "r_y3": 379.00415, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells." }, { "label": "list_item", "id": 17, "page_no": 11, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 308.86203, "t": 391.31015, "r": 545.11517, "b": 459.99164, "coord_origin": "TOPLEFT" }, "confidence": 0.8719939589500427, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 400.2167099999999, "r_x1": 328.55356, "r_y1": 400.2167099999999, "r_x2": 328.55356, "r_y2": 391.31015, "r_x3": 320.81702, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13242, "r_y0": 400.2167099999999, "r_x1": 545.11505, "r_y1": 400.2167099999999, "r_x2": 545.11505, "r_y2": 391.31015, "r_x3": 331.13242, "r_y3": 391.31015, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 412.17169, "r_x1": 545.11517, "r_y1": 412.17169, "r_x2": 545.11517, "r_y2": 403.26514, "r_x3": 308.86203, "r_y3": 403.26514, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 424.12668, "r_x1": 545.11511, "r_y1": 424.12668, "r_x2": 545.11511, "r_y2": 415.22012000000007, "r_x3": 308.86203, "r_y3": 415.22012000000007, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 436.0816699999999, "r_x1": 545.11511, "r_y1": 436.0816699999999, "r_x2": 545.11511, "r_y2": 427.17511, "r_x3": 308.86203, "r_y3": 427.17511, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 448.03665, "r_x1": 545.11505, "r_y1": 448.03665, "r_x2": 545.11505, "r_y2": 439.1301, "r_x3": 308.86203, "r_y3": 439.1301, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 459.99164, "r_x1": 426.18161, "r_y1": 459.99164, "r_x2": 426.18161, "r_y2": 451.08507999999995, "r_x3": 308.86203, "r_y3": 451.08507999999995, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score." }, { "label": "list_item", "id": 15, "page_no": 11, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.86203, "t": 463.39108, "r": 545.11517, "b": 567.93858, "coord_origin": "TOPLEFT" }, "confidence": 0.9126082062721252, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 472.29764, "r_x1": 328.67316, "r_y1": 472.29764, "r_x2": 328.67316, "r_y2": 463.39108, "r_x3": 320.81702, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29187, "r_y0": 472.29764, "r_x1": 545.11499, "r_y1": 472.29764, "r_x2": 545.11499, "r_y2": 463.39108, "r_x3": 331.29187, "r_y3": 463.39108, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 484.25262, "r_x1": 545.11505, "r_y1": 484.25262, "r_x2": 545.11505, "r_y2": 475.34607, "r_x3": 308.86203, "r_y3": 475.34607, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 496.20761, "r_x1": 545.11517, "r_y1": 496.20761, "r_x2": 545.11517, "r_y2": 487.30106, "r_x3": 308.86203, "r_y3": 487.30106, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 508.1626, "r_x1": 381.89786, "r_y1": 508.1626, "r_x2": 381.89786, "r_y2": 499.25604, "r_x3": 308.86203, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7023, "r_y0": 508.1626, "r_x1": 545.11517, "r_y1": 508.1626, "r_x2": 545.11517, "r_y2": 499.25604, "r_x3": 388.7023, "r_y3": 499.25604, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 520.11859, "r_x1": 545.11511, "r_y1": 520.11859, "r_x2": 545.11511, "r_y2": 511.21204, "r_x3": 308.86203, "r_y3": 511.21204, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 532.07358, "r_x1": 545.11505, "r_y1": 532.07358, "r_x2": 545.11505, "r_y2": 523.16702, "r_x3": 308.86203, "r_y3": 523.16702, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 544.02858, "r_x1": 545.11499, "r_y1": 544.02858, "r_x2": 545.11499, "r_y2": 535.12201, "r_x3": 308.86203, "r_y3": 535.12201, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 555.98358, "r_x1": 545.11517, "r_y1": 555.98358, "r_x2": 545.11517, "r_y2": 547.07703, "r_x3": 308.86203, "r_y3": 547.07703, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 567.93858, "r_x1": 442.22147000000007, "r_y1": 567.93858, "r_x2": 442.22147000000007, "r_y2": 559.03203, "r_x3": 308.86203, "r_y3": 559.03203, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan." }, { "label": "text", "id": 19, "page_no": 11, "cluster": { "id": 19, "label": "text", "bbox": { "l": 308.86203, "t": 571.33803, "r": 545.11688, "b": 604.15459, "coord_origin": "TOPLEFT" }, "confidence": 0.8459473848342896, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81702, "r_y0": 580.24458, "r_x1": 545.11493, "r_y1": 580.24458, "r_x2": 545.11493, "r_y2": 571.33803, "r_x3": 320.81702, "r_y3": 571.33803, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86203, "r_y0": 592.19958, "r_x1": 471.64093, "r_y1": 592.19958, "r_x2": 471.64093, "r_y2": 583.29303, "r_x3": 308.86203, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83405, "r_y0": 591.98041, "r_x1": 479.71872, "r_y1": 591.98041, "r_x2": 479.71872, "r_y2": 583.1336200000001, "r_x3": 474.83405, "r_y3": 583.1336200000001, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.26903999999996, "r_y0": 592.19958, "r_x1": 545.11688, "r_y1": 592.19958, "r_x2": 545.11688, "r_y2": 583.29303, "r_x3": 483.26903999999996, "r_y3": 583.29303, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 604.15459, "r_x1": 329.91306, "r_y1": 604.15459, "r_x2": 329.91306, "r_y2": 595.24803, "r_x3": 308.86206, "r_y3": 595.24803, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)." }, { "label": "list_item", "id": 21, "page_no": 11, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.86206, "t": 607.55304, "r": 545.11505, "b": 628.4155900000001, "coord_origin": "TOPLEFT" }, "confidence": 0.7716891169548035, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 616.4595899999999, "r_x1": 332.8718, "r_y1": 616.4595899999999, "r_x2": 332.8718, "r_y2": 607.55304, "r_x3": 320.81705, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.92532, "r_y0": 616.4595899999999, "r_x1": 545.11505, "r_y1": 616.4595899999999, "r_x2": 545.11505, "r_y2": 607.55304, "r_x3": 339.92532, "r_y3": 607.55304, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 628.4155900000001, "r_x1": 495.2923, "r_y1": 628.4155900000001, "r_x2": 495.2923, "r_y2": 619.50903, "r_x3": 308.86206, "r_y3": 619.50903, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row." }, { "label": "list_item", "id": 18, "page_no": 11, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.86206, "t": 631.81403, "r": 545.11505, "b": 664.63059, "coord_origin": "TOPLEFT" }, "confidence": 0.8584907054901123, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 640.72058, "r_x1": 545.11505, "r_y1": 640.72058, "r_x2": 545.11505, "r_y2": 631.81403, "r_x3": 320.81705, "r_y3": 631.81403, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 652.67558, "r_x1": 455.28238, "r_y1": 652.67558, "r_x2": 455.28238, "r_y2": 643.7690299999999, "r_x3": 308.86206, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.77704, "r_y0": 652.45641, "r_x1": 463.47067, "r_y1": 652.45641, "r_x2": 463.47067, "r_y2": 643.60962, "r_x3": 457.77704, "r_y3": 643.60962, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97104, "r_y0": 652.67558, "r_x1": 545.11389, "r_y1": 652.67558, "r_x2": 545.11389, "r_y2": 643.7690299999999, "r_x3": 465.97104, "r_y3": 643.7690299999999, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 664.63059, "r_x1": 332.38376, "r_y1": 664.63059, "r_x2": 332.38376, "r_y2": 655.72403, "r_x3": 308.86206, "r_y3": 655.72403, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)." }, { "label": "list_item", "id": 22, "page_no": 11, "cluster": { "id": 22, "label": "list_item", "bbox": { "l": 308.86206, "t": 668.03003, "r": 545.11499, "b": 688.89159, "coord_origin": "TOPLEFT" }, "confidence": 0.7590745091438293, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 676.93659, "r_x1": 545.11499, "r_y1": 676.93659, "r_x2": 545.11499, "r_y2": 668.03003, "r_x3": 320.81705, "r_y3": 668.03003, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 688.89159, "r_x1": 510.5848700000001, "r_y1": 688.89159, "r_x2": 510.5848700000001, "r_y2": 679.98503, "r_x3": 308.86206, "r_y3": 679.98503, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column." }, { "label": "list_item", "id": 25, "page_no": 11, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 308.86206, "t": 692.290024, "r": 545.11517, "b": 713.151596, "coord_origin": "TOPLEFT" }, "confidence": 0.6971189975738525, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.81705, "r_y0": 701.196594, "r_x1": 545.11505, "r_y1": 701.196594, "r_x2": 545.11505, "r_y2": 692.290024, "r_x3": 320.81705, "r_y3": 692.290024, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86206, "r_y0": 713.151596, "r_x1": 545.11517, "r_y1": 713.151596, "r_x2": 545.11517, "r_y2": 704.245026, "r_x3": 308.86206, "r_y3": 704.245026, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-" } ], "headers": [ { "label": "page_footer", "id": 14, "page_no": 11, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 292.63107, "t": 734.13303, "r": 302.59366, "b": 743.039593, "coord_origin": "TOPLEFT" }, "confidence": 0.9126598238945007, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63107, "r_y0": 743.039593, "r_x1": 302.59366, "r_y1": 743.039593, "r_x2": 302.59366, "r_y2": 734.13303, "r_x3": 292.63107, "r_y3": 734.13303, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" } ] } }, { "page_no": 12, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 88.846588, "r_y1": 84.11492999999996, "r_x2": 88.846588, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.06994999999995, "r_x1": 286.36496, "r_y1": 96.06994999999995, "r_x2": 286.36496, "r_y2": 87.16339000000005, "r_x3": 62.067001, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 127.03322, "r_y1": 108.02495999999985, "r_x2": 127.03322, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 119.7508499999999, "r_x1": 286.36499, "r_y1": 119.7508499999999, "r_x2": 286.36499, "r_y2": 111.16309000000001, "r_x3": 62.067001, "r_y3": 111.16309000000001, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.70587, "r_x1": 234.06139999999996, "r_y1": 131.70587, "r_x2": 234.06139999999996, "r_y2": 123.11810000000003, "r_x3": 50.112, "r_y3": 123.11810000000003, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.341, "r_y0": 510.96292, "r_x1": 273.13342, "r_y1": 510.96292, "r_x2": 273.13342, "r_y2": 502.05637, "r_x3": 63.341, "r_y3": 502.05637, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 315.50491, "r_x1": 345.63397, "r_y1": 315.50491, "r_x2": 345.63397, "r_y2": 306.59836, "r_x3": 308.862, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.78711, "r_y0": 315.50491, "r_x1": 545.11511, "r_y1": 315.50491, "r_x2": 545.11511, "r_y2": 306.59836, "r_x3": 352.78711, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 327.45990000000006, "r_x1": 355.89545, "r_y1": 327.45990000000006, "r_x2": 355.89545, "r_y2": 318.55334, "r_x3": 308.862, "r_y3": 318.55334, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34299, "r_y0": 689.39993, "r_x1": 541.63232, "r_y1": 689.39993, "r_x2": 541.63232, "r_y2": 680.4933599999999, "r_x3": 312.34299, "r_y3": 680.4933599999999, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 14, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 88.846588, "b": 84.11492999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.7545598149299622, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 88.846588, "r_y1": 84.11492999999996, "r_x2": 88.846588, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.112, "t": 87.16339000000005, "r": 286.36496, "b": 108.02495999999985, "coord_origin": "TOPLEFT" }, "confidence": 0.9170762300491333, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.06994999999995, "r_x1": 286.36496, "r_y1": 96.06994999999995, "r_x2": 286.36496, "r_y2": 87.16339000000005, "r_x3": 62.067001, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 127.03322, "r_y1": 108.02495999999985, "r_x2": 127.03322, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 111.16309000000001, "r": 286.36499, "b": 131.70587, "coord_origin": "TOPLEFT" }, "confidence": 0.9454683065414429, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 119.7508499999999, "r_x1": 286.36499, "r_y1": 119.7508499999999, "r_x2": 286.36499, "r_y2": 111.16309000000001, "r_x3": 62.067001, "r_y3": 111.16309000000001, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.70587, "r_x1": 234.06139999999996, "r_y1": 131.70587, "r_x2": 234.06139999999996, "r_y2": 123.11810000000003, "r_x3": 50.112, "r_y3": 123.11810000000003, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "caption", "bbox": { "l": 63.341, "t": 502.05637, "r": 273.13342, "b": 510.96292, "coord_origin": "TOPLEFT" }, "confidence": 0.8971090316772461, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.341, "r_y0": 510.96292, "r_x1": 273.13342, "r_y1": 510.96292, "r_x2": 273.13342, "r_y2": 502.05637, "r_x3": 63.341, "r_y3": 502.05637, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "caption", "bbox": { "l": 308.862, "t": 306.59836, "r": 545.11511, "b": 327.45990000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.8773345351219177, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 315.50491, "r_x1": 345.63397, "r_y1": 315.50491, "r_x2": 345.63397, "r_y2": 306.59836, "r_x3": 308.862, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.78711, "r_y0": 315.50491, "r_x1": 545.11511, "r_y1": 315.50491, "r_x2": 545.11511, "r_y2": 306.59836, "r_x3": 352.78711, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 327.45990000000006, "r_x1": 355.89545, "r_y1": 327.45990000000006, "r_x2": 355.89545, "r_y2": 318.55334, "r_x3": 308.862, "r_y3": 318.55334, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "caption", "bbox": { "l": 312.34299, "t": 680.4933599999999, "r": 541.63232, "b": 689.39993, "coord_origin": "TOPLEFT" }, "confidence": 0.9188510179519653, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34299, "r_y0": 689.39993, "r_x1": 541.63232, "r_y1": 689.39993, "r_x2": 541.63232, "r_y2": 680.4933599999999, "r_x3": 312.34299, "r_y3": 680.4933599999999, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133358, "r": 302.59357, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.9020507335662842, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "table", "bbox": { "l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT" }, "confidence": 0.70481276512146, "cells": [], "children": [] }, { "id": 32, "label": "table", "bbox": { "l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT" }, "confidence": 0.564289927482605, "cells": [], "children": [] }, { "id": 9, "label": "table", "bbox": { "l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT" }, "confidence": 0.8857279419898987, "cells": [], "children": [] }, { "id": 21, "label": "table", "bbox": { "l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6602518558502197, "cells": [], "children": [] }, { "id": 4, "label": "table", "bbox": { "l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT" }, "confidence": 0.9155725836753845, "cells": [], "children": [] }, { "id": 19, "label": "picture", "bbox": { "l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT" }, "confidence": 0.6956620812416077, "cells": [], "children": [] }, { "id": 37, "label": "table", "bbox": { "l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT" }, "confidence": 0.52826988697052, "cells": [], "children": [] }, { "id": 6, "label": "table", "bbox": { "l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT" }, "confidence": 0.9085132479667664, "cells": [], "children": [] }, { "id": 12, "label": "table", "bbox": { "l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT" }, "confidence": 0.8486077189445496, "cells": [], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT" }, "confidence": 0.9613965749740601, "cells": [], "children": [] }, { "id": 10, "label": "table", "bbox": { "l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT" }, "confidence": 0.8815538287162781, "cells": [], "children": [] }, { "id": 5, "label": "table", "bbox": { "l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT" }, "confidence": 0.9096733927726746, "cells": [], "children": [] }, { "id": 13, "label": "picture", "bbox": { "l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT" }, "confidence": 0.8023569583892822, "cells": [], "children": [] }, { "id": 30, "label": "table", "bbox": { "l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT" }, "confidence": 0.5930293798446655, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "17": { "label": "table", "id": 17, "page_no": 12, "cluster": { "id": 17, "label": "table", "bbox": { "l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT" }, "confidence": 0.70481276512146, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "32": { "label": "table", "id": 32, "page_no": 12, "cluster": { "id": 32, "label": "table", "bbox": { "l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT" }, "confidence": 0.564289927482605, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "9": { "label": "table", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "table", "bbox": { "l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT" }, "confidence": 0.8857279419898987, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "21": { "label": "table", "id": 21, "page_no": 12, "cluster": { "id": 21, "label": "table", "bbox": { "l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6602518558502197, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "4": { "label": "table", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "table", "bbox": { "l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT" }, "confidence": 0.9155725836753845, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "37": { "label": "table", "id": 37, "page_no": 12, "cluster": { "id": 37, "label": "table", "bbox": { "l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT" }, "confidence": 0.52826988697052, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "6": { "label": "table", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "table", "bbox": { "l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT" }, "confidence": 0.9085132479667664, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "12": { "label": "table", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "table", "bbox": { "l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT" }, "confidence": 0.8486077189445496, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "0": { "label": "table", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "table", "bbox": { "l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT" }, "confidence": 0.9613965749740601, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "10": { "label": "table", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "table", "bbox": { "l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT" }, "confidence": 0.8815538287162781, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "5": { "label": "table", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "table", "bbox": { "l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT" }, "confidence": 0.9096733927726746, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "30": { "label": "table", "id": 30, "page_no": 12, "cluster": { "id": 30, "label": "table", "bbox": { "l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT" }, "confidence": 0.5930293798446655, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 88.846588, "b": 84.11492999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.7545598149299622, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 88.846588, "r_y1": 84.11492999999996, "r_x2": 88.846588, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "phan cell." }, { "label": "text", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.112, "t": 87.16339000000005, "r": 286.36496, "b": 108.02495999999985, "coord_origin": "TOPLEFT" }, "confidence": 0.9170762300491333, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.06994999999995, "r_x1": 286.36496, "r_y1": 96.06994999999995, "r_x2": 286.36496, "r_y2": 87.16339000000005, "r_x3": 62.067001, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 127.03322, "r_y1": 108.02495999999985, "r_x2": 127.03322, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9f. Otherwise create a new structural cell and match it wit the orphan cell." }, { "label": "text", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 111.16309000000001, "r": 286.36499, "b": 131.70587, "coord_origin": "TOPLEFT" }, "confidence": 0.9454683065414429, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 119.7508499999999, "r_x1": 286.36499, "r_y1": 119.7508499999999, "r_x2": 286.36499, "r_y2": 111.16309000000001, "r_x3": 62.067001, "r_y3": 111.16309000000001, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.70587, "r_x1": 234.06139999999996, "r_y1": 131.70587, "r_x2": 234.06139999999996, "r_y2": 123.11810000000003, "r_x3": 50.112, "r_y3": 123.11810000000003, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aditional images with examples of TableFormer predictions and post-processing can be found below." }, { "label": "caption", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 63.341, "t": 502.05637, "r": 273.13342, "b": 510.96292, "coord_origin": "TOPLEFT" }, "confidence": 0.8971090316772461, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.341, "r_y0": 510.96292, "r_x1": 273.13342, "r_y1": 510.96292, "r_x2": 273.13342, "r_y2": 502.05637, "r_x3": 63.341, "r_y3": 502.05637, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 8: Example of a table with multi-line header." }, { "label": "caption", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.862, "t": 306.59836, "r": 545.11511, "b": 327.45990000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.8773345351219177, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 315.50491, "r_x1": 345.63397, "r_y1": 315.50491, "r_x2": 345.63397, "r_y2": 306.59836, "r_x3": 308.862, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.78711, "r_y0": 315.50491, "r_x1": 545.11511, "r_y1": 315.50491, "r_x2": 545.11511, "r_y2": 306.59836, "r_x3": 352.78711, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 327.45990000000006, "r_x1": 355.89545, "r_y1": 327.45990000000006, "r_x2": 355.89545, "r_y2": 318.55334, "r_x3": 308.862, "r_y3": 318.55334, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 9: Example of a table with big empty distance between cells." }, { "label": "caption", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 312.34299, "t": 680.4933599999999, "r": 541.63232, "b": 689.39993, "coord_origin": "TOPLEFT" }, "confidence": 0.9188510179519653, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34299, "r_y0": 689.39993, "r_x1": 541.63232, "r_y1": 689.39993, "r_x2": 541.63232, "r_y2": 680.4933599999999, "r_x3": 312.34299, "r_y3": 680.4933599999999, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 10: Example of a complex table with empty cells." }, { "label": "page_footer", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133358, "r": 302.59357, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.9020507335662842, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" }, { "label": "table", "id": 17, "page_no": 12, "cluster": { "id": 17, "label": "table", "bbox": { "l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT" }, "confidence": 0.70481276512146, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 32, "page_no": 12, "cluster": { "id": 32, "label": "table", "bbox": { "l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT" }, "confidence": 0.564289927482605, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "table", "bbox": { "l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT" }, "confidence": 0.8857279419898987, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 21, "page_no": 12, "cluster": { "id": 21, "label": "table", "bbox": { "l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6602518558502197, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "table", "bbox": { "l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT" }, "confidence": 0.9155725836753845, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 19, "page_no": 12, "cluster": { "id": 19, "label": "picture", "bbox": { "l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT" }, "confidence": 0.6956620812416077, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 37, "page_no": 12, "cluster": { "id": 37, "label": "table", "bbox": { "l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT" }, "confidence": 0.52826988697052, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "table", "bbox": { "l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT" }, "confidence": 0.9085132479667664, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "table", "bbox": { "l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT" }, "confidence": 0.8486077189445496, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "table", "bbox": { "l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT" }, "confidence": 0.9613965749740601, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "table", "bbox": { "l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT" }, "confidence": 0.8815538287162781, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "table", "bbox": { "l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT" }, "confidence": 0.9096733927726746, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT" }, "confidence": 0.8023569583892822, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 30, "page_no": 12, "cluster": { "id": 30, "label": "table", "bbox": { "l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT" }, "confidence": 0.5930293798446655, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "body": [ { "label": "text", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.112, "t": 75.20836999999995, "r": 88.846588, "b": 84.11492999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.7545598149299622, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 84.11492999999996, "r_x1": 88.846588, "r_y1": 84.11492999999996, "r_x2": 88.846588, "r_y2": 75.20836999999995, "r_x3": 50.112, "r_y3": 75.20836999999995, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "phan cell." }, { "label": "text", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.112, "t": 87.16339000000005, "r": 286.36496, "b": 108.02495999999985, "coord_origin": "TOPLEFT" }, "confidence": 0.9170762300491333, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 96.06994999999995, "r_x1": 286.36496, "r_y1": 96.06994999999995, "r_x2": 286.36496, "r_y2": 87.16339000000005, "r_x3": 62.067001, "r_y3": 87.16339000000005, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 108.02495999999985, "r_x1": 127.03322, "r_y1": 108.02495999999985, "r_x2": 127.03322, "r_y2": 99.11841000000004, "r_x3": 50.112, "r_y3": 99.11841000000004, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9f. Otherwise create a new structural cell and match it wit the orphan cell." }, { "label": "text", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.112, "t": 111.16309000000001, "r": 286.36499, "b": 131.70587, "coord_origin": "TOPLEFT" }, "confidence": 0.9454683065414429, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.067001, "r_y0": 119.7508499999999, "r_x1": 286.36499, "r_y1": 119.7508499999999, "r_x2": 286.36499, "r_y2": 111.16309000000001, "r_x3": 62.067001, "r_y3": 111.16309000000001, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 131.70587, "r_x1": 234.06139999999996, "r_y1": 131.70587, "r_x2": 234.06139999999996, "r_y2": 123.11810000000003, "r_x3": 50.112, "r_y3": 123.11810000000003, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aditional images with examples of TableFormer predictions and post-processing can be found below." }, { "label": "caption", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 63.341, "t": 502.05637, "r": 273.13342, "b": 510.96292, "coord_origin": "TOPLEFT" }, "confidence": 0.8971090316772461, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.341, "r_y0": 510.96292, "r_x1": 273.13342, "r_y1": 510.96292, "r_x2": 273.13342, "r_y2": 502.05637, "r_x3": 63.341, "r_y3": 502.05637, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 8: Example of a table with multi-line header." }, { "label": "caption", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.862, "t": 306.59836, "r": 545.11511, "b": 327.45990000000006, "coord_origin": "TOPLEFT" }, "confidence": 0.8773345351219177, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 315.50491, "r_x1": 345.63397, "r_y1": 315.50491, "r_x2": 345.63397, "r_y2": 306.59836, "r_x3": 308.862, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.78711, "r_y0": 315.50491, "r_x1": 545.11511, "r_y1": 315.50491, "r_x2": 545.11511, "r_y2": 306.59836, "r_x3": 352.78711, "r_y3": 306.59836, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.862, "r_y0": 327.45990000000006, "r_x1": 355.89545, "r_y1": 327.45990000000006, "r_x2": 355.89545, "r_y2": 318.55334, "r_x3": 308.862, "r_y3": 318.55334, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 9: Example of a table with big empty distance between cells." }, { "label": "caption", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 312.34299, "t": 680.4933599999999, "r": 541.63232, "b": 689.39993, "coord_origin": "TOPLEFT" }, "confidence": 0.9188510179519653, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34299, "r_y0": 689.39993, "r_x1": 541.63232, "r_y1": 689.39993, "r_x2": 541.63232, "r_y2": 680.4933599999999, "r_x3": 312.34299, "r_y3": 680.4933599999999, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 10: Example of a complex table with empty cells." }, { "label": "table", "id": 17, "page_no": 12, "cluster": { "id": 17, "label": "table", "bbox": { "l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT" }, "confidence": 0.70481276512146, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 32, "page_no": 12, "cluster": { "id": 32, "label": "table", "bbox": { "l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT" }, "confidence": 0.564289927482605, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "table", "bbox": { "l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT" }, "confidence": 0.8857279419898987, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 21, "page_no": 12, "cluster": { "id": 21, "label": "table", "bbox": { "l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6602518558502197, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "table", "bbox": { "l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT" }, "confidence": 0.9155725836753845, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 19, "page_no": 12, "cluster": { "id": 19, "label": "picture", "bbox": { "l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT" }, "confidence": 0.6956620812416077, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 37, "page_no": 12, "cluster": { "id": 37, "label": "table", "bbox": { "l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT" }, "confidence": 0.52826988697052, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "table", "bbox": { "l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT" }, "confidence": 0.9085132479667664, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "table", "bbox": { "l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT" }, "confidence": 0.8486077189445496, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "table", "bbox": { "l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT" }, "confidence": 0.9613965749740601, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "table", "bbox": { "l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT" }, "confidence": 0.8815538287162781, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "table", "bbox": { "l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT" }, "confidence": 0.9096733927726746, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT" }, "confidence": 0.8023569583892822, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 30, "page_no": 12, "cluster": { "id": 30, "label": "table", "bbox": { "l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT" }, "confidence": 0.5930293798446655, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "headers": [ { "label": "page_footer", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133358, "r": 302.59357, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.9020507335662842, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" } ] } }, { "page_no": 13, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.67691, "r_x1": 93.050797, "r_y1": 365.67691, "r_x2": 93.050797, "r_y2": 356.77036, "r_x3": 50.112, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73071, "r_y0": 365.67691, "r_x1": 286.36508, "r_y1": 365.67691, "r_x2": 286.36508, "r_y2": 356.77036, "r_x3": 103.73071, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 377.6319, "r_x1": 70.864098, "r_y1": 377.6319, "r_x2": 70.864098, "r_y2": 368.72534, "r_x3": 50.112, "r_y3": 368.72534, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.618998999999995, "r_y0": 680.72492, "r_x1": 281.8559, "r_y1": 680.72492, "r_x2": 281.8559, "r_y2": 671.81836, "r_x3": 54.618998999999995, "r_y3": 671.81836, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79001, "r_y0": 380.59091, "r_x1": 538.18524, "r_y1": 380.59091, "r_x2": 538.18524, "r_y2": 371.68436, "r_x3": 315.79001, "r_y3": 371.68436, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98499, "r_y0": 692.452927, "r_x1": 508.98935000000006, "r_y1": 692.452927, "r_x2": 508.98935000000006, "r_y2": 683.54636, "r_x3": 344.98499, "r_y3": 683.54636, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039925, "r_x1": 302.59357, "r_y1": 743.039925, "r_x2": 302.59357, "r_y2": 734.133362, "r_x3": 292.63098, "r_y3": 734.133362, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "caption", "bbox": { "l": 50.112, "t": 356.77036, "r": 286.36508, "b": 377.6319, "coord_origin": "TOPLEFT" }, "confidence": 0.951069176197052, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.67691, "r_x1": 93.050797, "r_y1": 365.67691, "r_x2": 93.050797, "r_y2": 356.77036, "r_x3": 50.112, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73071, "r_y0": 365.67691, "r_x1": 286.36508, "r_y1": 365.67691, "r_x2": 286.36508, "r_y2": 356.77036, "r_x3": 103.73071, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 377.6319, "r_x1": 70.864098, "r_y1": 377.6319, "r_x2": 70.864098, "r_y2": 368.72534, "r_x3": 50.112, "r_y3": 368.72534, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "caption", "bbox": { "l": 54.618998999999995, "t": 671.81836, "r": 281.8559, "b": 680.72492, "coord_origin": "TOPLEFT" }, "confidence": 0.926384687423706, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.618998999999995, "r_y0": 680.72492, "r_x1": 281.8559, "r_y1": 680.72492, "r_x2": 281.8559, "r_y2": 671.81836, "r_x3": 54.618998999999995, "r_y3": 671.81836, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "caption", "bbox": { "l": 315.79001, "t": 371.68436, "r": 538.18524, "b": 380.59091, "coord_origin": "TOPLEFT" }, "confidence": 0.9178510904312134, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79001, "r_y0": 380.59091, "r_x1": 538.18524, "r_y1": 380.59091, "r_x2": 538.18524, "r_y2": 371.68436, "r_x3": 315.79001, "r_y3": 371.68436, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "caption", "bbox": { "l": 344.98499, "t": 683.54636, "r": 508.98935000000006, "b": 692.452927, "coord_origin": "TOPLEFT" }, "confidence": 0.9191023111343384, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98499, "r_y0": 692.452927, "r_x1": 508.98935000000006, "r_y1": 692.452927, "r_x2": 508.98935000000006, "r_y2": 683.54636, "r_x3": 344.98499, "r_y3": 683.54636, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133362, "r": 302.59357, "b": 743.039925, "coord_origin": "TOPLEFT" }, "confidence": 0.887715220451355, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039925, "r_x1": 302.59357, "r_y1": 743.039925, "r_x2": 302.59357, "r_y2": 734.133362, "r_x3": 292.63098, "r_y3": 734.133362, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "picture", "bbox": { "l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT" }, "confidence": 0.5003598928451538, "cells": [], "children": [] }, { "id": 30, "label": "picture", "bbox": { "l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT" }, "confidence": 0.5613773465156555, "cells": [], "children": [] }, { "id": 23, "label": "table", "bbox": { "l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT" }, "confidence": 0.6235634684562683, "cells": [], "children": [] }, { "id": 33, "label": "table", "bbox": { "l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT" }, "confidence": 0.5502500534057617, "cells": [], "children": [] }, { "id": 27, "label": "table", "bbox": { "l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT" }, "confidence": 0.5696635246276855, "cells": [], "children": [] }, { "id": 38, "label": "table", "bbox": { "l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT" }, "confidence": 0.5227423310279846, "cells": [], "children": [] }, { "id": 10, "label": "table", "bbox": { "l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT" }, "confidence": 0.8384715914726257, "cells": [], "children": [] }, { "id": 9, "label": "table", "bbox": { "l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT" }, "confidence": 0.8418155908584595, "cells": [], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8502867221832275, "cells": [], "children": [] }, { "id": 4, "label": "table", "bbox": { "l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT" }, "confidence": 0.8922696709632874, "cells": [], "children": [] }, { "id": 15, "label": "table", "bbox": { "l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT" }, "confidence": 0.6817973256111145, "cells": [], "children": [] }, { "id": 6, "label": "table", "bbox": { "l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT" }, "confidence": 0.88722163438797, "cells": [], "children": [] }, { "id": 7, "label": "table", "bbox": { "l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT" }, "confidence": 0.8717735409736633, "cells": [], "children": [] }, { "id": 11, "label": "picture", "bbox": { "l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT" }, "confidence": 0.7871124744415283, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "23": { "label": "table", "id": 23, "page_no": 13, "cluster": { "id": 23, "label": "table", "bbox": { "l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT" }, "confidence": 0.6235634684562683, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "33": { "label": "table", "id": 33, "page_no": 13, "cluster": { "id": 33, "label": "table", "bbox": { "l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT" }, "confidence": 0.5502500534057617, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "27": { "label": "table", "id": 27, "page_no": 13, "cluster": { "id": 27, "label": "table", "bbox": { "l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT" }, "confidence": 0.5696635246276855, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "38": { "label": "table", "id": 38, "page_no": 13, "cluster": { "id": 38, "label": "table", "bbox": { "l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT" }, "confidence": 0.5227423310279846, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "10": { "label": "table", "id": 10, "page_no": 13, "cluster": { "id": 10, "label": "table", "bbox": { "l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT" }, "confidence": 0.8384715914726257, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "9": { "label": "table", "id": 9, "page_no": 13, "cluster": { "id": 9, "label": "table", "bbox": { "l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT" }, "confidence": 0.8418155908584595, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "8": { "label": "table", "id": 8, "page_no": 13, "cluster": { "id": 8, "label": "table", "bbox": { "l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8502867221832275, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "4": { "label": "table", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "table", "bbox": { "l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT" }, "confidence": 0.8922696709632874, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "15": { "label": "table", "id": 15, "page_no": 13, "cluster": { "id": 15, "label": "table", "bbox": { "l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT" }, "confidence": 0.6817973256111145, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "6": { "label": "table", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "table", "bbox": { "l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT" }, "confidence": 0.88722163438797, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "7": { "label": "table", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "table", "bbox": { "l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT" }, "confidence": 0.8717735409736633, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.112, "t": 356.77036, "r": 286.36508, "b": 377.6319, "coord_origin": "TOPLEFT" }, "confidence": 0.951069176197052, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.67691, "r_x1": 93.050797, "r_y1": 365.67691, "r_x2": 93.050797, "r_y2": 356.77036, "r_x3": 50.112, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73071, "r_y0": 365.67691, "r_x1": 286.36508, "r_y1": 365.67691, "r_x2": 286.36508, "r_y2": 356.77036, "r_x3": 103.73071, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 377.6319, "r_x1": 70.864098, "r_y1": 377.6319, "r_x2": 70.864098, "r_y2": 368.72534, "r_x3": 50.112, "r_y3": 368.72534, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 11: Simple table with different style and empty cells." }, { "label": "caption", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 54.618998999999995, "t": 671.81836, "r": 281.8559, "b": 680.72492, "coord_origin": "TOPLEFT" }, "confidence": 0.926384687423706, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.618998999999995, "r_y0": 680.72492, "r_x1": 281.8559, "r_y1": 680.72492, "r_x2": 281.8559, "r_y2": 671.81836, "r_x3": 54.618998999999995, "r_y3": 671.81836, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 12: Simple table predictions and post processing." }, { "label": "caption", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "caption", "bbox": { "l": 315.79001, "t": 371.68436, "r": 538.18524, "b": 380.59091, "coord_origin": "TOPLEFT" }, "confidence": 0.9178510904312134, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79001, "r_y0": 380.59091, "r_x1": 538.18524, "r_y1": 380.59091, "r_x2": 538.18524, "r_y2": 371.68436, "r_x3": 315.79001, "r_y3": 371.68436, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 13: Table predictions example on colorful table." }, { "label": "caption", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 344.98499, "t": 683.54636, "r": 508.98935000000006, "b": 692.452927, "coord_origin": "TOPLEFT" }, "confidence": 0.9191023111343384, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98499, "r_y0": 692.452927, "r_x1": 508.98935000000006, "r_y1": 692.452927, "r_x2": 508.98935000000006, "r_y2": 683.54636, "r_x3": 344.98499, "r_y3": 683.54636, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 14: Example with multi-line text." }, { "label": "page_footer", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133362, "r": 302.59357, "b": 743.039925, "coord_origin": "TOPLEFT" }, "confidence": 0.887715220451355, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039925, "r_x1": 302.59357, "r_y1": 743.039925, "r_x2": 302.59357, "r_y2": 734.133362, "r_x3": 292.63098, "r_y3": 734.133362, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "picture", "id": 41, "page_no": 13, "cluster": { "id": 41, "label": "picture", "bbox": { "l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT" }, "confidence": 0.5003598928451538, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 30, "page_no": 13, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT" }, "confidence": 0.5613773465156555, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 23, "page_no": 13, "cluster": { "id": 23, "label": "table", "bbox": { "l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT" }, "confidence": 0.6235634684562683, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 33, "page_no": 13, "cluster": { "id": 33, "label": "table", "bbox": { "l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT" }, "confidence": 0.5502500534057617, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 27, "page_no": 13, "cluster": { "id": 27, "label": "table", "bbox": { "l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT" }, "confidence": 0.5696635246276855, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 38, "page_no": 13, "cluster": { "id": 38, "label": "table", "bbox": { "l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT" }, "confidence": 0.5227423310279846, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 13, "cluster": { "id": 10, "label": "table", "bbox": { "l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT" }, "confidence": 0.8384715914726257, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 13, "cluster": { "id": 9, "label": "table", "bbox": { "l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT" }, "confidence": 0.8418155908584595, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 8, "page_no": 13, "cluster": { "id": 8, "label": "table", "bbox": { "l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8502867221832275, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "table", "bbox": { "l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT" }, "confidence": 0.8922696709632874, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 15, "page_no": 13, "cluster": { "id": 15, "label": "table", "bbox": { "l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT" }, "confidence": 0.6817973256111145, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "table", "bbox": { "l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT" }, "confidence": 0.88722163438797, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "table", "bbox": { "l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT" }, "confidence": 0.8717735409736633, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 11, "page_no": 13, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT" }, "confidence": 0.7871124744415283, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.112, "t": 356.77036, "r": 286.36508, "b": 377.6319, "coord_origin": "TOPLEFT" }, "confidence": 0.951069176197052, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 365.67691, "r_x1": 93.050797, "r_y1": 365.67691, "r_x2": 93.050797, "r_y2": 356.77036, "r_x3": 50.112, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73071, "r_y0": 365.67691, "r_x1": 286.36508, "r_y1": 365.67691, "r_x2": 286.36508, "r_y2": 356.77036, "r_x3": 103.73071, "r_y3": 356.77036, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 377.6319, "r_x1": 70.864098, "r_y1": 377.6319, "r_x2": 70.864098, "r_y2": 368.72534, "r_x3": 50.112, "r_y3": 368.72534, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 11: Simple table with different style and empty cells." }, { "label": "caption", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 54.618998999999995, "t": 671.81836, "r": 281.8559, "b": 680.72492, "coord_origin": "TOPLEFT" }, "confidence": 0.926384687423706, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.618998999999995, "r_y0": 680.72492, "r_x1": 281.8559, "r_y1": 680.72492, "r_x2": 281.8559, "r_y2": 671.81836, "r_x3": 54.618998999999995, "r_y3": 671.81836, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 12: Simple table predictions and post processing." }, { "label": "caption", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "caption", "bbox": { "l": 315.79001, "t": 371.68436, "r": 538.18524, "b": 380.59091, "coord_origin": "TOPLEFT" }, "confidence": 0.9178510904312134, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79001, "r_y0": 380.59091, "r_x1": 538.18524, "r_y1": 380.59091, "r_x2": 538.18524, "r_y2": 371.68436, "r_x3": 315.79001, "r_y3": 371.68436, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 13: Table predictions example on colorful table." }, { "label": "caption", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 344.98499, "t": 683.54636, "r": 508.98935000000006, "b": 692.452927, "coord_origin": "TOPLEFT" }, "confidence": 0.9191023111343384, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98499, "r_y0": 692.452927, "r_x1": 508.98935000000006, "r_y1": 692.452927, "r_x2": 508.98935000000006, "r_y2": 683.54636, "r_x3": 344.98499, "r_y3": 683.54636, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 14: Example with multi-line text." }, { "label": "picture", "id": 41, "page_no": 13, "cluster": { "id": 41, "label": "picture", "bbox": { "l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT" }, "confidence": 0.5003598928451538, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 30, "page_no": 13, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT" }, "confidence": 0.5613773465156555, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 23, "page_no": 13, "cluster": { "id": 23, "label": "table", "bbox": { "l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT" }, "confidence": 0.6235634684562683, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 33, "page_no": 13, "cluster": { "id": 33, "label": "table", "bbox": { "l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT" }, "confidence": 0.5502500534057617, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 27, "page_no": 13, "cluster": { "id": 27, "label": "table", "bbox": { "l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT" }, "confidence": 0.5696635246276855, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 38, "page_no": 13, "cluster": { "id": 38, "label": "table", "bbox": { "l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT" }, "confidence": 0.5227423310279846, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 13, "cluster": { "id": 10, "label": "table", "bbox": { "l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT" }, "confidence": 0.8384715914726257, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 13, "cluster": { "id": 9, "label": "table", "bbox": { "l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT" }, "confidence": 0.8418155908584595, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 8, "page_no": 13, "cluster": { "id": 8, "label": "table", "bbox": { "l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT" }, "confidence": 0.8502867221832275, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "table", "bbox": { "l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT" }, "confidence": 0.8922696709632874, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 15, "page_no": 13, "cluster": { "id": 15, "label": "table", "bbox": { "l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT" }, "confidence": 0.6817973256111145, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "table", "bbox": { "l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT" }, "confidence": 0.88722163438797, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "table", "bbox": { "l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT" }, "confidence": 0.8717735409736633, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 11, "page_no": 13, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT" }, "confidence": 0.7871124744415283, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_footer", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133362, "r": 302.59357, "b": 743.039925, "coord_origin": "TOPLEFT" }, "confidence": 0.887715220451355, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039925, "r_x1": 302.59357, "r_y1": 743.039925, "r_x2": 302.59357, "r_y2": 734.133362, "r_x3": 292.63098, "r_y3": 734.133362, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" } ] } }, { "page_no": 14, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.233002, "r_y0": 653.25793, "r_x1": 252.24225, "r_y1": 653.25793, "r_x2": 252.24225, "r_y2": 644.3513800000001, "r_x3": 84.233002, "r_y3": 644.3513800000001, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 661.8419, "r_x1": 545.11511, "r_y1": 661.8419, "r_x2": 545.11511, "r_y2": 652.93535, "r_x3": 308.86197, "r_y3": 652.93535, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 673.79691, "r_x1": 497.60349, "r_y1": 673.79691, "r_x2": 497.60349, "r_y2": 664.89035, "r_x3": 308.86197, "r_y3": 664.89035, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039906, "r_x1": 302.59357, "r_y1": 743.039906, "r_x2": 302.59357, "r_y2": 734.133343, "r_x3": 292.63098, "r_y3": 734.133343, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "caption", "bbox": { "l": 84.233002, "t": 644.3513800000001, "r": 252.24225, "b": 653.25793, "coord_origin": "TOPLEFT" }, "confidence": 0.9257225394248962, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.233002, "r_y0": 653.25793, "r_x1": 252.24225, "r_y1": 653.25793, "r_x2": 252.24225, "r_y2": 644.3513800000001, "r_x3": 84.233002, "r_y3": 644.3513800000001, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "caption", "bbox": { "l": 308.86197, "t": 652.93535, "r": 545.11511, "b": 673.79691, "coord_origin": "TOPLEFT" }, "confidence": 0.9134758710861206, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 661.8419, "r_x1": 545.11511, "r_y1": 661.8419, "r_x2": 545.11511, "r_y2": 652.93535, "r_x3": 308.86197, "r_y3": 652.93535, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 673.79691, "r_x1": 497.60349, "r_y1": 673.79691, "r_x2": 497.60349, "r_y2": 664.89035, "r_x3": 308.86197, "r_y3": 664.89035, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133343, "r": 302.59357, "b": 743.039906, "coord_origin": "TOPLEFT" }, "confidence": 0.9037020802497864, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039906, "r_x1": 302.59357, "r_y1": 743.039906, "r_x2": 302.59357, "r_y2": 734.133343, "r_x3": 292.63098, "r_y3": 734.133343, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "table", "bbox": { "l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT" }, "confidence": 0.8569068908691406, "cells": [], "children": [] }, { "id": 6, "label": "picture", "bbox": { "l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT" }, "confidence": 0.8099280595779419, "cells": [], "children": [] }, { "id": 19, "label": "table", "bbox": { "l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT" }, "confidence": 0.5584819912910461, "cells": [], "children": [] }, { "id": 2, "label": "table", "bbox": { "l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT" }, "confidence": 0.9060239195823669, "cells": [], "children": [] }, { "id": 18, "label": "picture", "bbox": { "l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT" }, "confidence": 0.567050039768219, "cells": [], "children": [] }, { "id": 10, "label": "table", "bbox": { "l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT" }, "confidence": 0.7748245000839233, "cells": [], "children": [] }, { "id": 20, "label": "picture", "bbox": { "l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT" }, "confidence": 0.5515198707580566, "cells": [], "children": [] }, { "id": 9, "label": "table", "bbox": { "l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT" }, "confidence": 0.7755160927772522, "cells": [], "children": [] }, { "id": 5, "label": "picture", "bbox": { "l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT" }, "confidence": 0.8410326838493347, "cells": [], "children": [] }, { "id": 22, "label": "picture", "bbox": { "l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT" }, "confidence": 0.5478786826133728, "cells": [], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT" }, "confidence": 0.7805566787719727, "cells": [], "children": [] }, { "id": 7, "label": "picture", "bbox": { "l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.8057592511177063, "cells": [], "children": [] }, { "id": 11, "label": "table", "bbox": { "l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6835257411003113, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "4": { "label": "table", "id": 4, "page_no": 14, "cluster": { "id": 4, "label": "table", "bbox": { "l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT" }, "confidence": 0.8569068908691406, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "19": { "label": "table", "id": 19, "page_no": 14, "cluster": { "id": 19, "label": "table", "bbox": { "l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT" }, "confidence": 0.5584819912910461, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "2": { "label": "table", "id": 2, "page_no": 14, "cluster": { "id": 2, "label": "table", "bbox": { "l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT" }, "confidence": 0.9060239195823669, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "10": { "label": "table", "id": 10, "page_no": 14, "cluster": { "id": 10, "label": "table", "bbox": { "l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT" }, "confidence": 0.7748245000839233, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "9": { "label": "table", "id": 9, "page_no": 14, "cluster": { "id": 9, "label": "table", "bbox": { "l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT" }, "confidence": 0.7755160927772522, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "8": { "label": "table", "id": 8, "page_no": 14, "cluster": { "id": 8, "label": "table", "bbox": { "l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT" }, "confidence": 0.7805566787719727, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "11": { "label": "table", "id": 11, "page_no": 14, "cluster": { "id": 11, "label": "table", "bbox": { "l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6835257411003113, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 0, "page_no": 14, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 84.233002, "t": 644.3513800000001, "r": 252.24225, "b": 653.25793, "coord_origin": "TOPLEFT" }, "confidence": 0.9257225394248962, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.233002, "r_y0": 653.25793, "r_x1": 252.24225, "r_y1": 653.25793, "r_x2": 252.24225, "r_y2": 644.3513800000001, "r_x3": 84.233002, "r_y3": 644.3513800000001, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 15: Example with triangular table." }, { "label": "caption", "id": 1, "page_no": 14, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 308.86197, "t": 652.93535, "r": 545.11511, "b": 673.79691, "coord_origin": "TOPLEFT" }, "confidence": 0.9134758710861206, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 661.8419, "r_x1": 545.11511, "r_y1": 661.8419, "r_x2": 545.11511, "r_y2": 652.93535, "r_x3": 308.86197, "r_y3": 652.93535, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 673.79691, "r_x1": 497.60349, "r_y1": 673.79691, "r_x2": 497.60349, "r_y2": 664.89035, "r_x3": 308.86197, "r_y3": 664.89035, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact." }, { "label": "page_footer", "id": 3, "page_no": 14, "cluster": { "id": 3, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133343, "r": 302.59357, "b": 743.039906, "coord_origin": "TOPLEFT" }, "confidence": 0.9037020802497864, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039906, "r_x1": 302.59357, "r_y1": 743.039906, "r_x2": 302.59357, "r_y2": 734.133343, "r_x3": 292.63098, "r_y3": 734.133343, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15" }, { "label": "table", "id": 4, "page_no": 14, "cluster": { "id": 4, "label": "table", "bbox": { "l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT" }, "confidence": 0.8569068908691406, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 6, "page_no": 14, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT" }, "confidence": 0.8099280595779419, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 19, "page_no": 14, "cluster": { "id": 19, "label": "table", "bbox": { "l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT" }, "confidence": 0.5584819912910461, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 2, "page_no": 14, "cluster": { "id": 2, "label": "table", "bbox": { "l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT" }, "confidence": 0.9060239195823669, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 18, "page_no": 14, "cluster": { "id": 18, "label": "picture", "bbox": { "l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT" }, "confidence": 0.567050039768219, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 10, "page_no": 14, "cluster": { "id": 10, "label": "table", "bbox": { "l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT" }, "confidence": 0.7748245000839233, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 20, "page_no": 14, "cluster": { "id": 20, "label": "picture", "bbox": { "l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT" }, "confidence": 0.5515198707580566, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 9, "page_no": 14, "cluster": { "id": 9, "label": "table", "bbox": { "l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT" }, "confidence": 0.7755160927772522, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 5, "page_no": 14, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT" }, "confidence": 0.8410326838493347, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 22, "page_no": 14, "cluster": { "id": 22, "label": "picture", "bbox": { "l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT" }, "confidence": 0.5478786826133728, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 8, "page_no": 14, "cluster": { "id": 8, "label": "table", "bbox": { "l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT" }, "confidence": 0.7805566787719727, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 7, "page_no": 14, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.8057592511177063, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 14, "cluster": { "id": 11, "label": "table", "bbox": { "l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6835257411003113, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "body": [ { "label": "caption", "id": 0, "page_no": 14, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 84.233002, "t": 644.3513800000001, "r": 252.24225, "b": 653.25793, "coord_origin": "TOPLEFT" }, "confidence": 0.9257225394248962, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.233002, "r_y0": 653.25793, "r_x1": 252.24225, "r_y1": 653.25793, "r_x2": 252.24225, "r_y2": 644.3513800000001, "r_x3": 84.233002, "r_y3": 644.3513800000001, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 15: Example with triangular table." }, { "label": "caption", "id": 1, "page_no": 14, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 308.86197, "t": 652.93535, "r": 545.11511, "b": 673.79691, "coord_origin": "TOPLEFT" }, "confidence": 0.9134758710861206, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 661.8419, "r_x1": 545.11511, "r_y1": 661.8419, "r_x2": 545.11511, "r_y2": 652.93535, "r_x3": 308.86197, "r_y3": 652.93535, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86197, "r_y0": 673.79691, "r_x1": 497.60349, "r_y1": 673.79691, "r_x2": 497.60349, "r_y2": 664.89035, "r_x3": 308.86197, "r_y3": 664.89035, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact." }, { "label": "table", "id": 4, "page_no": 14, "cluster": { "id": 4, "label": "table", "bbox": { "l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT" }, "confidence": 0.8569068908691406, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 6, "page_no": 14, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT" }, "confidence": 0.8099280595779419, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 19, "page_no": 14, "cluster": { "id": 19, "label": "table", "bbox": { "l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT" }, "confidence": 0.5584819912910461, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 2, "page_no": 14, "cluster": { "id": 2, "label": "table", "bbox": { "l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT" }, "confidence": 0.9060239195823669, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 18, "page_no": 14, "cluster": { "id": 18, "label": "picture", "bbox": { "l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT" }, "confidence": 0.567050039768219, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 10, "page_no": 14, "cluster": { "id": 10, "label": "table", "bbox": { "l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT" }, "confidence": 0.7748245000839233, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 20, "page_no": 14, "cluster": { "id": 20, "label": "picture", "bbox": { "l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT" }, "confidence": 0.5515198707580566, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 9, "page_no": 14, "cluster": { "id": 9, "label": "table", "bbox": { "l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT" }, "confidence": 0.7755160927772522, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 5, "page_no": 14, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT" }, "confidence": 0.8410326838493347, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 22, "page_no": 14, "cluster": { "id": 22, "label": "picture", "bbox": { "l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT" }, "confidence": 0.5478786826133728, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 8, "page_no": 14, "cluster": { "id": 8, "label": "table", "bbox": { "l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT" }, "confidence": 0.7805566787719727, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 7, "page_no": 14, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.8057592511177063, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 14, "cluster": { "id": 11, "label": "table", "bbox": { "l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT" }, "confidence": 0.6835257411003113, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "headers": [ { "label": "page_footer", "id": 3, "page_no": 14, "cluster": { "id": 3, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133343, "r": 302.59357, "b": 743.039906, "coord_origin": "TOPLEFT" }, "confidence": 0.9037020802497864, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039906, "r_x1": 302.59357, "r_y1": 743.039906, "r_x2": 302.59357, "r_y2": 734.133343, "r_x3": 292.63098, "r_y3": 734.133343, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15" } ] } }, { "page_no": 15, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 517.24393, "r_x1": 545.11383, "r_y1": 517.24393, "r_x2": 545.11383, "r_y2": 508.33737, "r_x3": 50.112, "r_y3": 508.33737, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 529.1989100000001, "r_x1": 173.23975, "r_y1": 529.1989100000001, "r_x2": 173.23975, "r_y2": 520.2923599999999, "r_x3": 50.112, "r_y3": 520.2923599999999, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "caption", "bbox": { "l": 50.112, "t": 508.33737, "r": 545.11383, "b": 529.1989100000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9624594449996948, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 517.24393, "r_x1": 545.11383, "r_y1": 517.24393, "r_x2": 545.11383, "r_y2": 508.33737, "r_x3": 50.112, "r_y3": 508.33737, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 529.1989100000001, "r_x1": 173.23975, "r_y1": 529.1989100000001, "r_x2": 173.23975, "r_y2": 520.2923599999999, "r_x3": 50.112, "r_y3": 520.2923599999999, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133358, "r": 302.59357, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.9134101271629333, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "picture", "bbox": { "l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT" }, "confidence": 0.6913455724716187, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 0, "page_no": 15, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.112, "t": 508.33737, "r": 545.11383, "b": 529.1989100000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9624594449996948, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 517.24393, "r_x1": 545.11383, "r_y1": 517.24393, "r_x2": 545.11383, "r_y2": 508.33737, "r_x3": 50.112, "r_y3": 508.33737, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 529.1989100000001, "r_x1": 173.23975, "r_y1": 529.1989100000001, "r_x2": 173.23975, "r_y2": 520.2923599999999, "r_x3": 50.112, "r_y3": 520.2923599999999, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure." }, { "label": "page_footer", "id": 1, "page_no": 15, "cluster": { "id": 1, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133358, "r": 302.59357, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.9134101271629333, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16" }, { "label": "picture", "id": 2, "page_no": 15, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT" }, "confidence": 0.6913455724716187, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 0, "page_no": 15, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.112, "t": 508.33737, "r": 545.11383, "b": 529.1989100000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9624594449996948, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 517.24393, "r_x1": 545.11383, "r_y1": 517.24393, "r_x2": 545.11383, "r_y2": 508.33737, "r_x3": 50.112, "r_y3": 508.33737, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.112, "r_y0": 529.1989100000001, "r_x1": 173.23975, "r_y1": 529.1989100000001, "r_x2": 173.23975, "r_y2": 520.2923599999999, "r_x3": 50.112, "r_y3": 520.2923599999999, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure." }, { "label": "picture", "id": 2, "page_no": 15, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT" }, "confidence": 0.6913455724716187, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_footer", "id": 1, "page_no": 15, "cluster": { "id": 1, "label": "page_footer", "bbox": { "l": 292.63098, "t": 734.133358, "r": 302.59357, "b": 743.039921, "coord_origin": "TOPLEFT" }, "confidence": 0.9134101271629333, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63098, "r_y0": 743.039921, "r_x1": 302.59357, "r_y1": 743.039921, "r_x2": 302.59357, "r_y2": 734.133358, "r_x3": 292.63098, "r_y3": 734.133358, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16" } ] } } ]